sherlock-project · shreyasNaik0101 · Oct 3, 2025 · Oct 6, 2025 · Oct 6, 2025 · Oct 6, 2025
diff --git a/.actor/dataset_schema.json b/.actor/dataset_schema.json
@@ -29,7 +29,7 @@
               "fields": [
                 "username",
                 "links"
-              ],
+              ]
             },
             "display": {
                "component": "table",

diff --git a/sherlock_project/resources/data.json b/sherlock_project/resources/data.json
@@ -2263,11 +2263,11 @@
       "<div class=\"error-panel\"><span>User ",
       "<title>429 Too Many Requests</title>"
     ],
+    "aliases": ["X"],
     "errorType": "message",
     "regexCheck": "^[a-zA-Z0-9_]{1,15}$",
     "url": "https://x.com/{}",
     "urlMain": "https://x.com/",
-    "urlProbe": "https://nitter.privacydev.net/{}",
     "username_claimed": "blue"
   },
   "Typeracer": {

diff --git a/sherlock_project/resources/data.schema.json b/sherlock_project/resources/data.schema.json
@@ -1,149 +1,154 @@
 {
-  "$schema": "https://json-schema.org/draft/2020-12/schema",
-  "title": "Sherlock Target Manifest",
-  "description": "Social media targets to probe for the existence of known usernames",
-  "type": "object",
-  "properties": {
-    "$schema": { "type": "string" }
-  },
-  "patternProperties": {
-    "^(?!\\$).*?$": {
-      "type": "object",
-      "description": "Target name and associated information (key should be human readable name)",
-      "required": ["url", "urlMain", "errorType", "username_claimed"],
-      "properties": {
-        "url": { "type": "string" },
-        "urlMain": { "type": "string" },
-        "urlProbe": { "type": "string" },
-        "username_claimed": { "type": "string" },
-        "regexCheck": { "type": "string" },
-        "isNSFW": { "type": "boolean" },
-        "headers": { "type": "object" },
-        "request_payload": { "type": "object" },
-        "__comment__": {
-          "type": "string",
-          "description": "Used to clarify important target information if (and only if) a commit message would not suffice.\nThis key should not be parsed anywhere within Sherlock."
-        },
-        "tags": {
-          "oneOf": [
-            { "$ref": "#/$defs/tag" },
-            { "type": "array", "items": { "$ref": "#/$defs/tag" } }
-          ]
-        },
-        "request_method": {
-          "type": "string",
-          "enum": ["GET", "POST", "HEAD", "PUT"]
-        },
-        "errorType": {
-          "oneOf": [
-            {
-              "type": "string",
-              "enum": ["message", "response_url", "status_code"]
-            },
-            {
-              "type": "array",
-              "items": {
-                "type": "string",
-                "enum": ["message", "response_url", "status_code"]
-              }
-            }
-          ]
-        },
-        "errorMsg": {
-          "oneOf": [
-            { "type": "string" },
-            { "type": "array", "items": { "type": "string" } }
-          ]
-        },
-        "errorCode": {
-          "oneOf": [
-            { "type": "integer" },
-            { "type": "array", "items": { "type": "integer" } }
-          ]
-        },
-        "errorUrl": { "type": "string" },
-        "response_url": { "type": "string" }
-      },
-      "dependencies": {
-        "errorMsg": {
-          "oneOf": [
-            { "properties": { "errorType": { "const": "message" } } },
-            {
-              "properties": {
-                "errorType": {
-                  "type": "array",
-                  "contains": { "const": "message" }
-                }
-              }
-            }
-          ]
-        },
-        "errorUrl": {
-          "oneOf": [
-            { "properties": { "errorType": { "const": "response_url" } } },
-            {
-              "properties": {
+    "$schema": "https://json-schema.org/draft/2020-12/schema",
+    "title": "Sherlock Target Manifest",
+    "description": "Social media targets to probe for the existence of known usernames",
+    "type": "object",
+    "properties": {
+        "$schema": { "type": "string" }
+    },
+    "patternProperties": {
+        "^(?!\\$).*?$": {
+            "type": "object",
+            "description": "Target name and associated information (key should be human readable name)",
+            "required": ["url", "urlMain", "errorType", "username_claimed"],
+            "properties": {
+                "url": { "type": "string" },
+                "urlMain": { "type": "string" },
+                "urlProbe": { "type": "string" },
+                "username_claimed": { "type": "string" },
+                "username_unclaimed": { "type": "string" },
+                "regexCheck": { "type": "string" },
+                "isNSFW": { "type": "boolean" },
+                "headers": { "type": "object" },
+                "request_payload": { "type": "object" },
+                "__comment__": {
+                    "type": "string",
+                    "description": "Used to clarify important target information if (and only if) a commit message would not suffice.\nThis key should not be parsed anywhere within Sherlock."
+                },
+                "tags": {
+                    "oneOf": [
+                        { "$ref": "#/$defs/tag" },
+                        { "type": "array", "items": { "$ref": "#/$defs/tag" } }
+                    ]
+                },
+                "request_method": {
+                    "type": "string",
+                    "enum": ["GET", "POST", "HEAD", "PUT"]
+                },
                 "errorType": {
-                  "type": "array",
-                  "contains": { "const": "response_url" }
-                }
-              }
-            }
-          ]
-        },
-        "errorCode": {
-          "oneOf": [
-            { "properties": { "errorType": { "const": "status_code" } } },
-            {
-              "properties": {
-                "errorType": {
-                  "type": "array",
-                  "contains": { "const": "status_code" }
-                }
-              }
-            }
-          ]
-        }
-      },
-      "allOf": [
-        {
-          "if": {
-            "anyOf": [
-              { "properties": { "errorType": { "const": "message" } } },
-              {
-                "properties": {
-                  "errorType": {
+                    "oneOf": [
+                        {
+                            "type": "string",
+                            "enum": ["message", "response_url", "status_code"]
+                        },
+                        {
+                            "type": "array",
+                            "items": {
+                                "type": "string",
+                                "enum": ["message", "response_url", "status_code"]
+                            }
+                        }
+                    ]
+                },
+                "errorMsg": {
+                    "oneOf": [
+                        { "type": "string" },
+                        { "type": "array", "items": { "type": "string" } }
+                    ]
+                },
+                "errorCode": {
+                    "oneOf": [
+                        { "type": "integer" },
+                        { "type": "array", "items": { "type": "integer" } }
+                    ]
+                },
+                "errorUrl": { "type": "string" },
+                "response_url": { "type": "string" },
+                "aliases": {
                     "type": "array",
-                    "contains": { "const": "message" }
-                  }
+                    "items": { "type": "string" }
                 }
-              }
-            ]
-          },
-          "then": { "required": ["errorMsg"] }
-        },
-        {
-          "if": {
-            "anyOf": [
-              { "properties": { "errorType": { "const": "response_url" } } },
-              {
-                "properties": {
-                  "errorType": {
-                    "type": "array",
-                    "contains": { "const": "response_url" }
-                  }
+            },
+            "dependencies": {
+                "errorMsg": {
+                    "oneOf": [
+                        { "properties": { "errorType": { "const": "message" } } },
+                        {
+                            "properties": {
+                                "errorType": {
+                                    "type": "array",
+                                    "contains": { "const": "message" }
+                                }
+                            }
+                        }
+                    ]
+                },
+                "errorUrl": {
+                    "oneOf": [
+                        { "properties": { "errorType": { "const": "response_url" } } },
+                        {
+                            "properties": {
+                                "errorType": {
+                                    "type": "array",
+                                    "contains": { "const": "response_url" }
+                                }
+                            }
+                        }
+                    ]
+                },
+                "errorCode": {
+                    "oneOf": [
+                        { "properties": { "errorType": { "const": "status_code" } } },
+                        {
+                            "properties": {
+                                "errorType": {
+                                    "type": "array",
+                                    "contains": { "const": "status_code" }
+                                }
+                            }
+                        }
+                    ]
+                }
+            },
+            "allOf": [
+                {
+                    "if": {
+                        "anyOf": [
+                            { "properties": { "errorType": { "const": "message" } } },
+                            {
+                                "properties": {
+                                    "errorType": {
+                                        "type": "array",
+                                        "contains": { "const": "message" }
+                                    }
+                                }
+                            }
+                        ]
+                    },
+                    "then": { "required": ["errorMsg"] }
+                },
+                {
+                    "if": {
+                        "anyOf": [
+                            { "properties": { "errorType": { "const": "response_url" } } },
+                            {
+                                "properties": {
+                                    "errorType": {
+                                        "type": "array",
+                                        "contains": { "const": "response_url" }
+                                    }
+                                }
+                            }
+                        ]
+                    },
+                    "then": { "required": ["errorUrl"] }
                 }
-              }
-            ]
-          },
-          "then": { "required": ["errorUrl"] }
+            ],
+            "additionalProperties": false
         }
-      ],
-      "additionalProperties": false
+    },
+    "additionalProperties": false,
+    "$defs": {
+        "tag": { "type": "string", "enum": ["adult", "gaming"] }
     }
-  },
-  "additionalProperties": false,
-  "$defs": {
-    "tag": { "type": "string", "enum": ["adult", "gaming"] }
-  }
-}
+}
diff --git a/sherlock_project/sherlock.py b/sherlock_project/sherlock.py
@@ -779,6 +779,10 @@ def main():
     if not args.nsfw:
         sites.remove_nsfw_sites(do_not_remove=args.site_list)
 
+    # Create original dictionary from SitesInformation() object.
+    # Eventually, the rest of the code will be updated to use the new object
+    # directly, but this will glue the two pieces together.
+    site_data_all = {site.name: site.information for site in sites}
     # Create original dictionary from SitesInformation() object.
     # Eventually, the rest of the code will be updated to use the new object
     # directly, but this will glue the two pieces together.
@@ -791,15 +795,25 @@ def main():
         # Make sure that the sites are supported & build up pruned site database.
         site_data = {}
         site_missing = []
-        for site in args.site_list:
-            counter = 0
-            for existing_site in site_data_all:
-                if site.lower() == existing_site.lower():
-                    site_data[existing_site] = site_data_all[existing_site]
-                    counter += 1
-            if counter == 0:
-                # Build up list of sites not supported for future error message.
-                site_missing.append(f"'{site}'")
+
+        # Map every lowercase site name and alias to its canonical site name.
+        # Canonical names are registered first so that an alias can never
+        # shadow a real site that happens to share its (lowercased) spelling.
+        site_map = {name.lower(): name for name in site_data_all}
+        for site_name, site_info in site_data_all.items():
+            for alias in site_info.get("aliases", []):
+                site_map.setdefault(alias.lower(), site_name)
+
+        for site_name_from_user in args.site_list:
+            # Resolve the user's input (site name or alias, case-insensitive).
+            proper_site_name = site_map.get(site_name_from_user.lower())
+
+            if proper_site_name:
+                # Known site: copy its data into the pruned site database.
+                site_data[proper_site_name] = site_data_all[proper_site_name]
+            else:
+                # Unknown name/alias: collect it for the error message below.
+                site_missing.append(f"'{site_name_from_user}'")
 
         if site_missing:
             print(f"Error: Desired sites not found: {', '.join(site_missing)}.")