Skip to content

Commit d8f2dac

Browse files
Merge pull request #8984 from Sesquipedalian/3.0/robots_txt_content_signals
[3.0] Implements the Content Signals extension of robots.txt
2 parents 4a63861 + acba55e commit d8f2dac

File tree

7 files changed

+219
-116
lines changed

7 files changed

+219
-116
lines changed

Languages/en_US/Admin.php

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -234,7 +234,7 @@
234234
$txt['admin_log_desc'] = 'Lists administrative tasks that have been performed by admins of your forum.';
235235
$txt['moderation_log'] = 'Moderation Log';
236236
$txt['moderation_log_desc'] = 'Lists moderation activities that have been performed by moderators on your forum.';
237-
$txt['spider_log_desc'] = 'Review the entries related to search engine spider activity on your forum.';
237+
$txt['spider_log_desc'] = 'Review the entries related to search engine and robot activity on your forum.';
238238
$txt['log_settings_desc'] = 'Use these options to configure how logging works on your forum.';
239239
$txt['modlog_enabled'] = 'Enable the moderation log';
240240
$txt['adminlog_enabled'] = 'Enable the administration log';
@@ -747,7 +747,7 @@
747747
$txt['admin_browse_register_new'] = 'Register new member';
748748

749749
$txt['search_engines'] = 'Search Engines';
750-
$txt['spider_logs'] = 'Spider Log';
750+
$txt['spider_logs'] = 'Robot Log';
751751
$txt['spider_stats'] = 'Stats';
752752

753753
$txt['paid_subscriptions'] = 'Paid Subscriptions';

Languages/en_US/General.php

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -1103,15 +1103,15 @@
11031103
$txt['ignoring_user'] = 'You are ignoring this user.';
11041104
$txt['show_ignore_user_post'] = 'Show me the post.';
11051105

1106-
$txt['spider'] = 'Spider';
1107-
$txt['spiders'] = 'Spiders';
1106+
$txt['spider'] = 'Robot';
1107+
$txt['spiders'] = 'Robots';
11081108
$txt['spider_plural'] = '{0, plural,
1109-
one {spider}
1110-
other {spiders}
1109+
one {robot}
1110+
other {robots}
11111111
}';
11121112
$txt['number_of_spiders'] = '{0, plural,
1113-
one {# spider}
1114-
other {# spiders}
1113+
one {# robot}
1114+
other {# robots}
11151115
}';
11161116

11171117
$txt['downloads'] = 'Downloads';

Languages/en_US/Help.php

Lines changed: 14 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -565,28 +565,31 @@
565565
</ul>';
566566

567567
$helptxt['spider_mode'] = 'Sets the logging level.<br>
568-
Standard - Logs minimal spider activity.<br>
568+
Standard - Logs minimal robot activity.<br>
569569
Moderate - Provides more accurate statistics.<br>
570570
Aggressive - Same as &quot;Moderate&quot;, but logs data about each page visited.';
571571

572-
$helptxt['spider_group'] = 'By selecting a restrictive group, when a guest is detected as a search crawler it will automatically be assigned any &quot;deny&quot; permissions of this group in addition to the normal permissions of a guest. You can use this to provide lesser access to a search engine than you would a normal guest. You might for example wish to create a new group called &quot;Spiders&quot; and select that here. You could then deny permission for that group to view profiles to stop spiders indexing your members profiles.<br>Note: Spider detection is not perfect and can be simulated by users so this feature is not guaranteed to restrict content only to those search engines you have added.';
573-
$helptxt['show_spider_online'] = 'This setting allows you to select whether spiders should be listed in the &quot;Who’s Online&quot; list on the board index and &quot;Who’s Online&quot; page. The options are:
572+
$helptxt['spider_group'] = 'By selecting a restrictive group, when a guest is detected as a search crawler it will automatically be assigned any &quot;deny&quot; permissions of this group in addition to the normal permissions of a guest. You can use this to provide lesser access to a search engine than you would a normal guest. You might for example wish to create a new group called &quot;Robots&quot; and select that here. You could then deny permission for that group to view profiles to stop robots indexing your members’ profiles.<br>Note: Robot detection is not perfect and can be simulated by users so this feature is not guaranteed to restrict content only to those search engines you have added.';
573+
$helptxt['show_spider_online'] = 'This setting allows you to select whether robots should be listed in the &quot;Who’s Online&quot; list on the board index and &quot;Who’s Online&quot; page. The options are:
574574
<ul class="normallist">
575575
<li>
576576
<strong>Not at All</strong><br>
577-
Spiders will simply appear as guests to all users.
577+
Robots will simply appear as guests to all users.
578578
</li><li>
579-
<strong>Show Spider Quantity</strong><br>
580-
The Board Index will display the number of spiders currently visiting the forum.
579+
<strong>Show Robot Quantity</strong><br>
580+
The Board Index will display the number of robots currently visiting the forum.
581581
</li><li>
582-
<strong>Show Spider Names</strong><br>
583-
Each spider name will be revealed, so users can see how many of each spider is currently visiting the forum - this takes effect in both the Board Index and Who’s Online page.
582+
<strong>Show Robot Names</strong><br>
583+
Each robot name will be revealed, so users can see how many of each robot is currently visiting the forum - this takes effect in both the Board Index and Who’s Online page.
584584
</li><li>
585-
<strong>Show Spider Names - Admin Only</strong><br>
586-
As above except only Administrators can see spider status - to all other users spiders appear as guests.
585+
<strong>Show Robot Names - Admin Only</strong><br>
586+
As above except only Administrators can see robot status - to all other users robots appear as guests.
587587
</li>
588588
</ul>';
589-
$helptxt['robots_txt'] = 'The robots.txt file is used to implement the <a href="https://www.rfc-editor.org/rfc/rfc9309.html" class="bbc_link">Robots Exclusion Protocol</a>, a standard used by websites to indicate to search engine spiders and other web robots which portions of the website they are allowed to visit. This file is typically located in your website’s root directory.<br><br>SMF adds some rules to this file in order to guide spiders away from URLs that they should not bother to crawl. This improves efficiency and reduces server load when a spider is crawling your forum.';
589+
$helptxt['robots_txt'] = 'The robots.txt file is used to implement the <a href="https://www.rfc-editor.org/rfc/rfc9309.html" class="bbc_link">Robots Exclusion Protocol</a>, a standard used by websites to indicate to search engine spiders and other web robots which portions of the website they are allowed to visit. This file is typically located in your website’s root directory.<br><br>SMF adds some rules to this file in order to guide robots away from URLs that they should not bother to visit. This improves efficiency and reduces server load when a robot is indexing your forum.';
590+
$helptxt['robots_txt_search'] = 'This setting tells search engines whether they are permitted to show links to your forum in their search results. Most forums will want this enabled, but if you want your forum not to appear in search results, you can disable it.';
591+
$helptxt['robots_txt_ai_input'] = 'This setting tells search engines and other web robots whether they are permitted to use the content of your forum to generate AI summaries, etc. Unfortunately, there is no way to force search engines that index your site to obey these rules, but well-behaved ones will respect them.';
592+
$helptxt['robots_txt_ai_train'] = 'This setting tells artificial intelligence companies whether they are permitted to use the content of your forum to train their AI bots. Unfortunately, there is no way to force AI companies to obey these rules, but well-behaved ones will respect them.';
590593

591594
$helptxt['birthday_email'] = 'Choose the index of the birthday email message to use. A preview will be shown in the Email Subject and Email Body fields.<br><strong>Note:</strong> Selecting this setting does not automatically enable birthday emails. To enable birthday emails use the <a href="{scripturl}?action=admin;area=scheduledtasks;{session_var}={session_id}" target="_blank" rel="noopener">Scheduled Tasks</a> page and enable the birthday email task.';
592595
$helptxt['pm_bcc'] = 'When sending a personal message you can choose to add a recipient as BCC (Blind Carbon Copy). BCC recipients do not have their identities revealed to the other recipients of the message.';

Languages/en_US/Search.php

Lines changed: 24 additions & 21 deletions
Original file line numberDiff line numberDiff line change
@@ -124,44 +124,44 @@
124124
$txt['search_example'] = '<em>e.g.</em> Orwell "Animal Farm" -movie';
125125

126126
$txt['search_engines_description'] = 'From this area you can decide in what detail you wish to track search engines as they index your forum as well as review search engine logs.';
127-
$txt['spider_mode'] = 'Search Engine Tracking level';
128-
$txt['spider_mode_note'] = 'Note that logging of every spider action only occurs if tracking is set to either "moderate" or "aggressive". Detail of every spider’s action is only logged if tracking is set to "aggressive".';
127+
$txt['spider_mode'] = 'Search Engine and Robot Tracking level';
128+
$txt['spider_mode_note'] = 'Note that logging of every robot action only occurs if tracking is set to either "moderate" or "aggressive". Details about every robot action are only logged if tracking is set to "aggressive".';
129129
$txt['spider_mode_off'] = 'Disabled';
130130
$txt['spider_mode_standard'] = 'Standard';
131131
$txt['spider_mode_high'] = 'Moderate';
132132
$txt['spider_mode_vhigh'] = 'Aggressive';
133-
$txt['spider_settings_desc'] = 'You can change settings for spider tracking from this page. Note, if you wish to enable automatic pruning of the hit logs you can set this up <a href="%1$s">here</a>';
133+
$txt['spider_settings_desc'] = 'You can change settings for robot tracking from this page. Note, if you wish to enable automatic pruning of the hit logs you can set this up <a href="%1$s">here</a>.';
134134

135135
$txt['spider_group'] = 'Apply restrictive permissions from group';
136-
$txt['spider_group_note'] = 'To enable you to stop spiders indexing some pages.';
136+
$txt['spider_group_note'] = 'To enable you to stop robots indexing some pages.';
137137
$txt['spider_group_none'] = 'Disabled';
138138

139-
$txt['show_spider_online'] = 'Show spiders in the online list';
139+
$txt['show_spider_online'] = 'Show robots in the online list';
140140
$txt['show_spider_online_no'] = 'Not at all';
141-
$txt['show_spider_online_summary'] = 'Show spider quantity';
142-
$txt['show_spider_online_detail'] = 'Show spider names';
143-
$txt['show_spider_online_detail_admin'] = 'Show spider names - admin only';
141+
$txt['show_spider_online_summary'] = 'Show robot quantity';
142+
$txt['show_spider_online_detail'] = 'Show robot names';
143+
$txt['show_spider_online_detail_admin'] = 'Show robot names - admin only';
144144

145-
$txt['spider_name'] = 'Spider Name';
145+
$txt['spider_name'] = 'Robot Name';
146146
$txt['spider_last_seen'] = 'Last Seen';
147147
$txt['spider_last_never'] = 'Never';
148148
$txt['spider_agent'] = 'User Agent';
149149
$txt['spider_ip_info'] = 'IP Addresses';
150-
$txt['spiders_add'] = 'Add new Spider';
151-
$txt['spiders_edit'] = 'Edit Spider';
150+
$txt['spiders_add'] = 'Add new robot';
151+
$txt['spiders_edit'] = 'Edit robot';
152152
$txt['spiders_remove_selected'] = 'Remove selected';
153-
$txt['spider_remove_selected_confirm'] = 'Are you sure you want to remove these spiders?-n-All associated statistics will also be deleted!';
154-
$txt['spiders_no_entries'] = 'There are currently no spiders configured.';
153+
$txt['spider_remove_selected_confirm'] = 'Are you sure you want to remove these robots?-n-All associated statistics will also be deleted!';
154+
$txt['spiders_no_entries'] = 'There are currently no robots configured.';
155155

156-
$txt['add_spider_desc'] = 'From this page you can edit the parameters against which a spider is categorized. If a guest’s user agent/IP address matches those entered below it will be detected as a search engine spider and tracked as per the forum preferences.';
157-
$txt['spider_name_desc'] = 'Name by which the spider will be referred.';
158-
$txt['spider_agent_desc'] = 'User agent associated with this spider.';
159-
$txt['spider_ip_info_desc'] = 'Comma separated list of IP addresses associated with this spider.';
156+
$txt['add_spider_desc'] = 'From this page you can edit the parameters against which a robot is categorized. If a guest’s user agent or IP address matches those entered below, the guest will be detected as a robot and tracked as per the forum preferences.';
157+
$txt['spider_name_desc'] = 'Name by which the robot will be referred.';
158+
$txt['spider_agent_desc'] = 'User agent associated with this robot.';
159+
$txt['spider_ip_info_desc'] = 'Comma separated list of IP addresses associated with this robot.';
160160

161161
$txt['spider_time'] = 'Time';
162162
$txt['spider_viewing'] = 'Viewing';
163-
$txt['spider_logs_empty'] = 'There are currently no spider log entries.';
164-
$txt['spider_logs_info'] = 'Note that logging of every spider action only occurs if tracking is set to either "moderate" or "aggressive". Detail of every spider’s action is only logged if tracking is set to "aggressive".';
163+
$txt['spider_logs_empty'] = 'There are currently no robot log entries.';
164+
$txt['spider_logs_info'] = 'Note that logging of every robot action only occurs if tracking is set to either "moderate" or "aggressive". Details about every robot action are only logged if tracking is set to "aggressive".';
165165
$txt['spider_disabled'] = 'Disabled';
166166
$txt['spider_log_empty_log'] = 'Clear Log';
167167
$txt['spider_log_empty_log_confirm'] = 'Are you sure you want to completely clear the log?';
@@ -172,19 +172,22 @@
172172
$txt['spider_logs_delete_submit'] = 'Delete';
173173

174174
// argument: an HTML <input> element.
175-
$txt['spider_stats_delete_older'] = 'Delete all spider statistics from spiders not seen in {input} days.';
175+
$txt['spider_stats_delete_older'] = 'Delete all statistics from robots not seen in {input} days.';
176176

177177
// Don't use entities in the below string.
178178
$txt['spider_logs_delete_confirm'] = 'Are you sure you wish to empty out all log entries?';
179179

180180
$txt['spider_stats_select_month'] = 'Jump to Month';
181181
$txt['spider_stats_page_hits'] = 'Page Hits';
182-
$txt['spider_stats_no_entries'] = 'There are currently no spider statistics available.';
182+
$txt['spider_stats_no_entries'] = 'There are currently no robot statistics available.';
183183

184184
$txt['robots_txt'] = 'Add SMF rules to robots.txt';
185185
$txt['robots_txt_info'] = 'Enter the path to your robots.txt file so that SMF can append rules to it.';
186186
$txt['robots_txt_auto'] = 'Detect path';
187187
$txt['robots_txt_not_writable'] = 'The robots.txt file is not writable.';
188+
$txt['robots_txt_search'] = 'Allow search engines to link to the forum in their search results';
189+
$txt['robots_txt_ai_input'] = 'Allow search engines to generate AI summaries of forum content';
190+
$txt['robots_txt_ai_train'] = 'Allow forum content to be used for AI training';
188191

189192
$txt['meta_keywords'] = 'Meta keywords associated with forum';
190193
$txt['meta_keywords_note'] = 'In most situations, this should be left blank.';

Languages/en_US/Who.php

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -13,9 +13,9 @@
1313
$txt['who_show'] = 'Show ';
1414
$txt['who_show_members_only'] = 'Members only';
1515
$txt['who_show_guests_only'] = 'Guests only';
16-
$txt['who_show_spiders_only'] = 'Spiders only';
16+
$txt['who_show_spiders_only'] = 'Robots only';
1717
$txt['who_show_all'] = 'Everyone';
18-
$txt['who_no_online_spiders'] = 'There are currently no spiders online.';
18+
$txt['who_no_online_spiders'] = 'There are currently no robots online.';
1919
$txt['who_no_online_guests'] = 'There are currently no guests online.';
2020
$txt['who_no_online_members'] = 'There are currently no members online.';
2121
$txt['who_guest_login'] = 'User has been taken to the login page.';

0 commit comments

Comments
 (0)