From b5302f43afb87d7dbbbe7006b24e9306884edd6e Mon Sep 17 00:00:00 2001 From: Max Ostapenko <1611259+max-ostapenko@users.noreply.github.com> Date: Sun, 1 Mar 2026 18:28:42 +0100 Subject: [PATCH 1/3] Refactor SQL files to remove unnecessary #standardSQL comments --- sql/2025/accessibility/a11y_frontend_technology.sql | 1 - .../accessibility/a11y_overall_tech_usage_by_domain_rank.sql | 1 - sql/2025/accessibility/a11y_technology_usage.sql | 1 - sql/2025/accessibility/a11y_technology_usage_by_domain_rank.sql | 1 - sql/2025/accessibility/alt_ending_in_image_extension.sql | 1 - sql/2025/accessibility/anchors_with_role_button.sql | 1 - sql/2025/accessibility/button_name_sources.sql | 1 - sql/2025/accessibility/color_contrast.sql | 1 - sql/2025/accessibility/common_alt_text_length.sql | 1 - sql/2025/accessibility/common_aria_role.sql | 1 - sql/2025/accessibility/common_element_attributes.sql | 1 - sql/2025/accessibility/focus_outline_0.sql | 1 - sql/2025/accessibility/focus_visible.sql | 1 - sql/2025/accessibility/lighthouse_a11y_audits.sql | 1 - sql/2025/accessibility/lighthouse_a11y_audits_by_cms.sql | 1 - sql/2025/accessibility/lighthouse_a11y_score.sql | 1 - sql/2025/accessibility/lighthouse_score_by_cms.sql | 1 - sql/2025/accessibility/lighthouse_score_by_country.sql | 1 - sql/2025/accessibility/lighthouse_score_by_tld.sql | 1 - sql/2025/accessibility/media_query_features.sql | 1 - sql/2025/accessibility/page_title.sql | 1 - sql/2025/accessibility/pages_with_search_input.sql | 1 - sql/2025/accessibility/placeholder_but_no_label.sql | 1 - sql/2025/accessibility/sites_using_role.sql | 1 - sql/2025/accessibility/skip_links.sql | 1 - sql/2025/accessibility/sr_only_classes.sql | 1 - sql/2025/accessibility/tabindex_usage_and_values.sql | 1 - sql/2025/accessibility/table_stats.sql | 1 - sql/2025/accessibility/units_properties.sql | 1 - sql/2025/accessibility/valid_html_lang.sql | 1 - sql/2025/accessibility/video_track_usage.sql | 1 - sql/2025/accessibility/viewport_zoom_scale.sql | 1 - sql/2025/accessibility/viewport_zoom_scale_by_domain_rank.sql | 1 - sql/2025/capabilities/fugu.sql | 1 - sql/2025/capabilities/top.sql | 1 - sql/2025/cdn/alt_svc_protocol_analysis.sql | 1 - sql/2025/cdn/brotli_compression_adoption.sql | 1 - sql/2025/cdn/cache_control_analysis.sql | 1 - sql/2025/cdn/cdn_security_features_adoption.sql | 1 - sql/2025/cdn/cdn_usage_by_site_rank.sql | 1 - sql/2025/cdn/client_hints/baseline.sql | 1 - sql/2025/cdn/client_hints/client_hints_by_cdn.sql | 1 - sql/2025/cdn/client_hints/client_hints_by_header.sql | 1 - sql/2025/cdn/client_hints/client_hints_cdn_vs_origin.sql | 1 - sql/2025/cdn/client_hints/default_vs_requested_hints.sql | 1 - sql/2025/cdn/distribution_of_compression_types_by_cdn.sql | 1 - .../cdn/distribution_of_compression_types_cdn_vs_origin.sql | 1 - sql/2025/cdn/distribution_of_http_versions.sql | 1 - sql/2025/cdn/distribution_of_http_versions_cdn_vs_origin.sql | 1 - sql/2025/cdn/distribution_of_tls_time_by_cdn.sql | 1 - sql/2025/cdn/distribution_of_tls_time_cdn_vs_origin.sql | 1 - sql/2025/cdn/distribution_of_tls_versions.sql | 1 - sql/2025/cdn/distribution_of_tls_versions_cdn_vs_origin.sql | 1 - sql/2025/cdn/early_hints/baseline.sql | 1 - sql/2025/cdn/early_hints/early_hints_by_cdn.sql | 1 - sql/2025/cdn/early_hints/early_hints_cdn_vs_origin.sql | 1 - sql/2025/cdn/early_hints/preload_patterns.sql | 1 - sql/2025/cdn/early_hints/resource_types_preloaded.sql | 1 - sql/2025/cdn/h3_adoption_by_cdn_provider.sql | 1 - sql/2025/cdn/h3_adoption_by_cdn_vs_origin.sql | 1 - sql/2025/cdn/http3_performance_impact.sql | 1 - sql/2025/cdn/security_headers_by_cdn.sql | 1 - sql/2025/cdn/server_timing_adoption.sql | 1 - sql/2025/cdn/top_cdns.sql | 1 - sql/2025/cdn/top_cdns_by_rank.sql | 1 - sql/2025/cdn/usage_of_content_cdns.sql | 1 - sql/2025/cms/cms_adoption.sql | 1 - sql/2025/cms/cms_adoption_by_geo.sql | 1 - sql/2025/cms/cms_adoption_by_rank_all.sql | 1 - sql/2025/cms/cms_adoption_by_region.sql | 1 - sql/2025/cms/cms_adoption_by_subregion.sql | 1 - sql/2025/cms/image_format_popularity.sql | 1 - sql/2025/cms/lighthouse_category_scores_per_cms.sql | 1 - sql/2025/cms/lighthouse_category_scores_per_cms_yoy.sql | 1 - sql/2025/cms/page_weight_distribution.sql | 1 - sql/2025/cms/resource_weights.sql | 1 - sql/2025/cms/top_cms.sql | 1 - sql/2025/cms/top_cms_by_geo.sql | 1 - sql/2025/cms/top_cms_by_rank.sql | 1 - sql/2025/cms/wordpress_page_builders.sql | 1 - sql/2025/cms/wordpress_resources.sql | 1 - sql/2025/generative-ai/ai_tld.sql | 1 - sql/2025/generative-ai/gradient-client-rank.sql | 2 -- sql/2025/generative-ai/gradient-use.sql | 1 - sql/2025/generative-ai/gradient.sql | 1 - sql/2025/generative-ai/sites-with-robot-txt.sql | 1 - sql/2025/generative-ai/user-agent-named.sql | 1 - sql/2025/generative-ai/user-agent-years.sql | 1 - sql/2025/generative-ai/vibecodetools.sql | 1 - sql/2025/performance/early_hints_usage_rank.sql | 1 - sql/2025/performance/early_hints_usage_trends.sql | 1 - sql/2025/performance/generated_content.sql | 1 - sql/2025/performance/generated_content_web_vitals.sql | 1 - sql/2025/pwa/assetlink_usage.sql | 1 - sql/2025/pwa/fugu.sql | 1 - sql/2025/pwa/manifest_categories.sql | 1 - sql/2025/pwa/manifest_display_values.sql | 1 - sql/2025/pwa/manifest_icon_sizes.sql | 1 - sql/2025/pwa/manifest_orientations.sql | 1 - sql/2025/pwa/manifest_properties.sql | 1 - sql/2025/pwa/manifests_and_service_workers.sql | 1 - sql/2025/pwa/manifests_description.sql | 1 - sql/2025/pwa/manifests_file_handlers.sql | 1 - sql/2025/pwa/manifests_iarc.sql | 1 - sql/2025/pwa/manifests_lang.sql | 1 - sql/2025/pwa/manifests_not_json_parsable.sql | 1 - sql/2025/pwa/manifests_note_taking.sql | 1 - sql/2025/pwa/manifests_preferring_native_apps.sql | 1 - sql/2025/pwa/manifests_protocol_handlers.sql | 1 - sql/2025/pwa/manifests_screenshots.sql | 1 - sql/2025/pwa/manifests_screenshots_platform_narrow.sql | 1 - sql/2025/pwa/manifests_screenshots_platform_wide.sql | 1 - sql/2025/pwa/manifests_share_target.sql | 1 - sql/2025/pwa/manifests_shortcuts.sql | 1 - sql/2025/pwa/manifests_window_controls_overlay.sql | 1 - sql/2025/pwa/popular_pwa_libraries.sql | 1 - sql/2025/pwa/popular_pwa_libraries_helper.sql | 1 - sql/2025/pwa/pwa_blink_usage.sql | 1 - sql/2025/pwa/pwa_notification_acceptance_rates.sql | 1 - sql/2025/pwa/pwa_notification_acceptance_rates_over_time.sql | 1 - sql/2025/pwa/sw_adoption_over_time.sql | 1 - sql/2025/pwa/sw_adoption_over_time_ranking.sql | 1 - sql/2025/pwa/sw_events.sql | 1 - sql/2025/pwa/sw_methods.sql | 1 - sql/2025/pwa/sw_objects.sql | 1 - sql/2025/pwa/sw_objects_name_only.sql | 1 - sql/2025/pwa/sw_registration_properties.sql | 1 - sql/2025/pwa/sw_registration_properties_name_only.sql | 1 - sql/2025/pwa/workbox_methods.sql | 1 - sql/2025/pwa/workbox_packages.sql | 1 - sql/2025/pwa/workbox_usage.sql | 1 - sql/2025/pwa/workbox_versions.sql | 1 - sql/2025/security/audit_issues.sql | 1 - sql/2025/security/bot_detection.sql | 1 - sql/2025/security/clear-site-data_value_prevalence.sql | 1 - sql/2025/security/coep_header_prevalence.sql | 1 - sql/2025/security/cookie_age_negative.sql | 1 - sql/2025/security/cookie_age_percentiles.sql | 1 - sql/2025/security/cookie_attributes.sql | 1 - sql/2025/security/cookie_max_age_expires_top_values.sql | 1 - sql/2025/security/coop_header_prevalence.sql | 1 - sql/2025/security/corp_header_prevalence.sql | 1 - sql/2025/security/cryptominer_share.sql | 1 - sql/2025/security/cryptominer_usage.sql | 1 - sql/2025/security/csp_allowed_host_frequency.sql | 1 - sql/2025/security/csp_allowed_host_frequency_wss.sql | 1 - sql/2025/security/csp_directives_usage.sql | 1 - sql/2025/security/csp_features.sql | 1 - sql/2025/security/csp_most_common_header.sql | 1 - sql/2025/security/csp_number_of_allowed_hosts.sql | 1 - .../security/csp_script_source_list_keywords_per_header.sql | 1 - .../security/csp_script_source_list_keywords_per_request.sql | 1 - sql/2025/security/documentdomain_usage.sql | 1 - sql/2025/security/documentpolicy_most_common_header.sql | 1 - sql/2025/security/feature_adoption_by_category.sql | 1 - sql/2025/security/feature_adoption_by_country.sql | 1 - sql/2025/security/feature_adoption_by_other_features.sql | 1 - sql/2025/security/feature_adoption_by_technology.sql | 1 - sql/2025/security/fp_header_prevalence.sql | 1 - sql/2025/security/home_page_https_usage.sql | 1 - sql/2025/security/hsts_attributes.sql | 1 - sql/2025/security/hsts_max_age_percentiles.sql | 1 - sql/2025/security/html_sanitization_usage.sql | 1 - sql/2025/security/https_request_over_time.sql | 1 - sql/2025/security/https_server_redirects.sql | 1 - sql/2025/security/iframe_allow_directive_values.sql | 1 - sql/2025/security/iframe_allow_directives.sql | 1 - sql/2025/security/iframe_attribute_popular_hosts.sql | 1 - sql/2025/security/iframe_attributes_usage.sql | 1 - sql/2025/security/iframe_attributes_usage_fix.sql | 1 - sql/2025/security/iframe_sandbox_directives.sql | 1 - sql/2025/security/meta_csp_disallowed_directives.sql | 1 - sql/2025/security/meta_policies_allowed_vs_disallowed.sql | 1 - sql/2025/security/mimetype_file_extension_mismatch.sql | 1 - sql/2025/security/mixed_content.sql | 1 - sql/2025/security/oac_header_prevalence.sql | 1 - sql/2025/security/pp_header_prevalence.sql | 1 - sql/2025/security/robot_header_and_meta_tag_prevalence.sql | 1 - sql/2025/security/robot_txt_sensitive_disallow.sql | 1 - sql/2025/security/security_adoption_by_category.sql | 1 - sql/2025/security/security_adoption_by_rank.sql | 1 - sql/2025/security/security_headers_prevalence.sql | 1 - sql/2025/security/server_header_value_prevalence.sql | 1 - sql/2025/security/server_information_header_prevalence.sql | 1 - sql/2025/security/server_timing_usage_values.sql | 1 - sql/2025/security/sri_coverage_per_page.sql | 1 - sql/2025/security/sri_hash_functions.sql | 1 - sql/2025/security/sri_popular_hosts.sql | 1 - sql/2025/security/sri_usage.sql | 1 - sql/2025/security/tao_header_prevalence.sql | 1 - sql/2025/security/tls_ca_expired_cert.sql | 1 - sql/2025/security/tls_ca_issuers_pages.sql | 1 - sql/2025/security/tls_ca_issuers_pages_over_time.sql | 1 - sql/2025/security/tls_ca_issuers_requests.sql | 1 - sql/2025/security/tls_cipher_suite.sql | 1 - sql/2025/security/tls_forward_secrecy.sql | 1 - sql/2025/security/tls_versions_pages.sql | 1 - sql/2025/security/tls_versions_requests.sql | 1 - sql/2025/security/version-evolution-top-technologies.sql | 1 - sql/2025/security/web_cryptography_api.sql | 1 - sql/2025/security/well-known_change-password.sql | 1 - sql/2025/security/well-known_resource-not-be-200.sql | 1 - sql/2025/security/well-known_security.sql | 1 - sql/2025/security/xfo_header_prevalence.sql | 1 - sql/2025/seo/anchor-rel-attribute-usage-2025.sql | 1 - sql/2025/seo/anchor-same-site-occurance-stats-2025.sql | 1 - sql/2025/seo/content-language-2025.sql | 1 - sql/2025/seo/fixed-anchor-same-site-occurance-stats-2025.sql | 1 - sql/2025/seo/hreflang-header-usage-2025.sql | 1 - sql/2025/seo/hreflang-link-tag-usage-2025.sql | 1 - sql/2025/seo/iframe-loading-property-usage-2025.sql | 1 - sql/2025/seo/image-alt-stats-2025.sql | 1 - sql/2025/seo/invalid-head-elements-2025.sql | 1 - sql/2025/seo/invalid-head-sites-2025.sql | 2 -- sql/2025/seo/lighthouse-seo-stats-2025.sql | 1 - sql/2025/seo/llms-status-2025.sql | 1 - sql/2025/seo/llms-txt-errors-2025.sql | 1 - sql/2025/seo/mark-up-stats-2025.sql | 1 - .../seo/media-property-usage-link-tags-rel-alternate-2025.sql | 1 - sql/2025/seo/meta-tag-usage-by-name-2025.sql | 1 - sql/2025/seo/meta-tag-usage-by-property-2025.sql | 1 - sql/2025/seo/outgoing_links_by_rank-2025.sql | 1 - sql/2025/seo/pages-canonical-stats-2025.sql | 1 - sql/2025/seo/pages-containing-a-video-element-2025.sql | 1 - sql/2025/seo/robots-meta-usage-2025.sql | 1 - sql/2025/seo/robots-text-size-2025.sql | 1 - sql/2025/seo/robots-txt-size-2025.sql | 1 - sql/2025/seo/robots-txt-status-codes -2025.sql | 1 - sql/2025/seo/robots-txt-user-agent-usage-2025.sql | 1 - sql/2025/seo/root-pages-valid-llms-2025.sql | 1 - sql/2025/seo/seo-stats-2025.sql | 1 - sql/2025/seo/seo-stats-by-percentile-2025.sql | 1 - sql/2025/seo/structured-data-formats-2025.sql | 1 - sql/2025/seo/structured-data-schema-types-2025.sql | 1 - sql/2025/seo/test-invalid-head-sites.sql | 1 - sql/2025/seo/unused-css-js-2025.sql | 1 - sql/2025/sustainability/cache_header_usage.sql | 1 - sql/2025/sustainability/cdn_adoption.sql | 1 - sql/2025/sustainability/cms_bytes_per_type.sql | 1 - sql/2025/sustainability/content-visibility.sql | 1 - sql/2025/sustainability/ecommerce_bytes_per_type.sql | 1 - sql/2025/sustainability/favicons.sql | 1 - sql/2025/sustainability/global_emissions_per_page.sql | 1 - sql/2025/sustainability/green_third_party_requests.sql | 1 - sql/2025/sustainability/page_byte_pre_type.sql | 1 - sql/2025/sustainability/responsive_images.sql | 1 - sql/2025/sustainability/script_count.sql | 1 - sql/2025/sustainability/ssg_bytes_per_type.sql | 1 - sql/2025/sustainability/stylesheet_count.sql | 1 - sql/2025/sustainability/unminified_css_bytes.sql | 1 - sql/2025/sustainability/unminified_js_bytes.sql | 1 - sql/2025/sustainability/unused_css_bytes.sql | 1 - sql/2025/sustainability/unused_js_bytes.sql | 1 - sql/2025/sustainability/use_of_prefers_dark_mode_usage.sql | 1 - sql/2025/third-parties/consent_signal_basic_analysis.sql | 1 - .../consent_signal_prevalence_by_third_party_category.sql | 1 - .../consent_signal_survival_rate_through_chains.sql | 1 - .../consent_signal_survival_rate_through_redirects.sql | 1 - .../consent_signals_by_parameter_and_domain_optimized.sql | 1 - .../distribution_of_websites_by_number_of_third_parties.sql | 1 - sql/2025/third-parties/number_of_third_parties_by_rank.sql | 1 - .../number_of_third_parties_by_rank_and_category.sql | 1 - .../number_of_third_party_providers_by_rank_and_category.sql | 1 - .../third-parties/number_of_third_party_requests_by_rank.sql | 1 - .../number_of_third_party_requests_per_page_by_rank.sql | 1 - .../third-parties/percent_of_third_parties_by_content_type.sql | 1 - .../percent_of_websites_with_third_party_by_ranking.sql | 1 - ...nce_of_consent_signals_in_third_party_requests_optimized.sql | 1 - .../top100_third_parties_by_number_of_websites.sql | 1 - 269 files changed, 271 deletions(-) diff --git a/sql/2025/accessibility/a11y_frontend_technology.sql b/sql/2025/accessibility/a11y_frontend_technology.sql index ba2cb7bd121..f9d42994fa8 100644 --- a/sql/2025/accessibility/a11y_frontend_technology.sql +++ b/sql/2025/accessibility/a11y_frontend_technology.sql @@ -1,4 +1,3 @@ -#standardSQL -- Web Almanac — Lighthouse category scores by framework (2025-07-01) -- Google Sheet: a11y_frontend_technology -- diff --git a/sql/2025/accessibility/a11y_overall_tech_usage_by_domain_rank.sql b/sql/2025/accessibility/a11y_overall_tech_usage_by_domain_rank.sql index 049d5b8d8fe..3f078f8049f 100644 --- a/sql/2025/accessibility/a11y_overall_tech_usage_by_domain_rank.sql +++ b/sql/2025/accessibility/a11y_overall_tech_usage_by_domain_rank.sql @@ -1,4 +1,3 @@ -#standardSQL -- Accessibility Technology (A11y) Usage by Domain Rank (2025-07-01) -- Google Sheet: a11y_overall_tech_usage_by_domain_rank -- diff --git a/sql/2025/accessibility/a11y_technology_usage.sql b/sql/2025/accessibility/a11y_technology_usage.sql index fd0d43c5809..6afe2de72b6 100644 --- a/sql/2025/accessibility/a11y_technology_usage.sql +++ b/sql/2025/accessibility/a11y_technology_usage.sql @@ -1,4 +1,3 @@ -#standardSQL -- Accessibility Technology (A11y) Usage by Client (2025-07-01) -- Google Sheets: a11y_technology_usage -- diff --git a/sql/2025/accessibility/a11y_technology_usage_by_domain_rank.sql b/sql/2025/accessibility/a11y_technology_usage_by_domain_rank.sql index ba70b580578..404f0a2ba43 100644 --- a/sql/2025/accessibility/a11y_technology_usage_by_domain_rank.sql +++ b/sql/2025/accessibility/a11y_technology_usage_by_domain_rank.sql @@ -1,4 +1,3 @@ -#standardSQL # Purpose # Measure adoption of specific Accessibility-related technologies (apps/overlays) # across domain rank buckets in the 2025-07-01 HTTP Archive crawl. diff --git a/sql/2025/accessibility/alt_ending_in_image_extension.sql b/sql/2025/accessibility/alt_ending_in_image_extension.sql index b2f5a45819c..9977c8c4fa8 100644 --- a/sql/2025/accessibility/alt_ending_in_image_extension.sql +++ b/sql/2025/accessibility/alt_ending_in_image_extension.sql @@ -1,4 +1,3 @@ -#standardSQL -- Alt Texts Ending in File Extensions (2025-07-01) -- Google Sheet: alt_ending_in_image_extension -- Measures how often alt attributes end in file extensions (e.g., .jpg, .png). diff --git a/sql/2025/accessibility/anchors_with_role_button.sql b/sql/2025/accessibility/anchors_with_role_button.sql index 09b1f42c8b7..384b617f8a0 100644 --- a/sql/2025/accessibility/anchors_with_role_button.sql +++ b/sql/2025/accessibility/anchors_with_role_button.sql @@ -1,4 +1,3 @@ -#standardSQL -- Anchors with role="button" (2025-07-01) -- Google Sheet: anchors_with_role_button -- diff --git a/sql/2025/accessibility/button_name_sources.sql b/sql/2025/accessibility/button_name_sources.sql index b56b803cc9d..0770a62dd31 100644 --- a/sql/2025/accessibility/button_name_sources.sql +++ b/sql/2025/accessibility/button_name_sources.sql @@ -1,4 +1,3 @@ -#standardSQL -- Button Accessible Name Sources (2025-07-01) -- Google Sheet: button_name_sources -- diff --git a/sql/2025/accessibility/color_contrast.sql b/sql/2025/accessibility/color_contrast.sql index a2134b48414..b1d9bbcd5e4 100644 --- a/sql/2025/accessibility/color_contrast.sql +++ b/sql/2025/accessibility/color_contrast.sql @@ -1,4 +1,3 @@ -#standardSQL -- Color Contrast Audit Results (2025-07-01) -- Google Sheet: color_contrast -- diff --git a/sql/2025/accessibility/common_alt_text_length.sql b/sql/2025/accessibility/common_alt_text_length.sql index 2439547f6ab..b4119cb518a 100644 --- a/sql/2025/accessibility/common_alt_text_length.sql +++ b/sql/2025/accessibility/common_alt_text_length.sql @@ -1,4 +1,3 @@ -#standardSQL -- Most common lengths of text (2025-07-01) -- Google Sheets: common_alt_text_length -- diff --git a/sql/2025/accessibility/common_aria_role.sql b/sql/2025/accessibility/common_aria_role.sql index 9a3f98e042e..e050b348a15 100644 --- a/sql/2025/accessibility/common_aria_role.sql +++ b/sql/2025/accessibility/common_aria_role.sql @@ -1,4 +1,3 @@ -#standardSQL # Web Almanac — % of sites using each ARIA role (2025 schema; no JS UDF) # Google Sheet: common_aria_role # diff --git a/sql/2025/accessibility/common_element_attributes.sql b/sql/2025/accessibility/common_element_attributes.sql index a309a53522d..754e8bc06bd 100644 --- a/sql/2025/accessibility/common_element_attributes.sql +++ b/sql/2025/accessibility/common_element_attributes.sql @@ -1,4 +1,3 @@ -#standardSQL # Web Almanac — % of sites using each HTML attribute (2025-07-01; no JS UDF) # Google Sheet: common_element_attributes # diff --git a/sql/2025/accessibility/focus_outline_0.sql b/sql/2025/accessibility/focus_outline_0.sql index 9313b286166..e761c02a983 100644 --- a/sql/2025/accessibility/focus_outline_0.sql +++ b/sql/2025/accessibility/focus_outline_0.sql @@ -1,4 +1,3 @@ -#standardSQL # Web Almanac — Adoption of :focus pseudoclass and outline: 0 style (2025-07-01) # Google Sheet: focus_outline_0 # diff --git a/sql/2025/accessibility/focus_visible.sql b/sql/2025/accessibility/focus_visible.sql index 3b5da15aed2..f188db47340 100644 --- a/sql/2025/accessibility/focus_visible.sql +++ b/sql/2025/accessibility/focus_visible.sql @@ -1,4 +1,3 @@ -#standardSQL # Pages using :focus-visible in CSS (2025 crawl) # Google Sheet: focus_visible # diff --git a/sql/2025/accessibility/lighthouse_a11y_audits.sql b/sql/2025/accessibility/lighthouse_a11y_audits.sql index 82dad705db9..cf91d0c7f0d 100644 --- a/sql/2025/accessibility/lighthouse_a11y_audits.sql +++ b/sql/2025/accessibility/lighthouse_a11y_audits.sql @@ -1,4 +1,3 @@ -#standardSQL # Get summary of all Lighthouse scores for a category CREATE TEMPORARY FUNCTION getAudits(report JSON, category STRING) RETURNS ARRAY> LANGUAGE js AS ''' diff --git a/sql/2025/accessibility/lighthouse_a11y_audits_by_cms.sql b/sql/2025/accessibility/lighthouse_a11y_audits_by_cms.sql index 2d0484f57be..fc6745de967 100644 --- a/sql/2025/accessibility/lighthouse_a11y_audits_by_cms.sql +++ b/sql/2025/accessibility/lighthouse_a11y_audits_by_cms.sql @@ -1,4 +1,3 @@ -#standardSQL # Define the function outside the WITH clause CREATE TEMPORARY FUNCTION getAudits(report JSON, category STRING) RETURNS ARRAY> LANGUAGE js AS ''' diff --git a/sql/2025/accessibility/lighthouse_a11y_score.sql b/sql/2025/accessibility/lighthouse_a11y_score.sql index 2f4b6b3de0e..c53b17ae24c 100644 --- a/sql/2025/accessibility/lighthouse_a11y_score.sql +++ b/sql/2025/accessibility/lighthouse_a11y_score.sql @@ -1,4 +1,3 @@ -#standardSQL # Percentiles of Lighthouse accessibility scores using exact sorting WITH score_data AS ( diff --git a/sql/2025/accessibility/lighthouse_score_by_cms.sql b/sql/2025/accessibility/lighthouse_score_by_cms.sql index 3279b822858..48133b03eaf 100644 --- a/sql/2025/accessibility/lighthouse_score_by_cms.sql +++ b/sql/2025/accessibility/lighthouse_score_by_cms.sql @@ -1,4 +1,3 @@ -#standardSQL # Average Lighthouse scores (performance, accessibility, best-practices, SEO) for top CMS platforms within `httparchive.crawl.pages` WITH score_data AS ( diff --git a/sql/2025/accessibility/lighthouse_score_by_country.sql b/sql/2025/accessibility/lighthouse_score_by_country.sql index 7893edd69cb..866d4a0f6e7 100644 --- a/sql/2025/accessibility/lighthouse_score_by_country.sql +++ b/sql/2025/accessibility/lighthouse_score_by_country.sql @@ -1,4 +1,3 @@ -#standardSQL # Average Lighthouse scores per geo (by country and device) WITH geo_summary AS ( diff --git a/sql/2025/accessibility/lighthouse_score_by_tld.sql b/sql/2025/accessibility/lighthouse_score_by_tld.sql index 803b42a209d..7b59adea333 100644 --- a/sql/2025/accessibility/lighthouse_score_by_tld.sql +++ b/sql/2025/accessibility/lighthouse_score_by_tld.sql @@ -1,4 +1,3 @@ -#standardSQL # Group Lighthouse scores by top-level domain (TLD) WITH tld_score_data AS ( diff --git a/sql/2025/accessibility/media_query_features.sql b/sql/2025/accessibility/media_query_features.sql index e31346035a7..764365e9e69 100644 --- a/sql/2025/accessibility/media_query_features.sql +++ b/sql/2025/accessibility/media_query_features.sql @@ -1,4 +1,3 @@ -#standardSQL CREATE TEMPORARY FUNCTION getMediaQueryFeatures(css JSON) RETURNS ARRAY diff --git a/sql/2025/accessibility/page_title.sql b/sql/2025/accessibility/page_title.sql index 2702770c506..eb65ab75e6a 100644 --- a/sql/2025/accessibility/page_title.sql +++ b/sql/2025/accessibility/page_title.sql @@ -1,4 +1,3 @@ -#standardSQL # Page title stats (usage, descriptive, changed on render) SELECT client, diff --git a/sql/2025/accessibility/pages_with_search_input.sql b/sql/2025/accessibility/pages_with_search_input.sql index 823e584f48a..d0cc54cc3bd 100644 --- a/sql/2025/accessibility/pages_with_search_input.sql +++ b/sql/2025/accessibility/pages_with_search_input.sql @@ -1,4 +1,3 @@ -#standardSQL # Pages with search input CREATE TEMPORARY FUNCTION hasSearchInput(input_elements JSON) RETURNS BOOLEAN LANGUAGE js AS ''' diff --git a/sql/2025/accessibility/placeholder_but_no_label.sql b/sql/2025/accessibility/placeholder_but_no_label.sql index 67a850718bf..2392f9e1ff4 100644 --- a/sql/2025/accessibility/placeholder_but_no_label.sql +++ b/sql/2025/accessibility/placeholder_but_no_label.sql @@ -1,4 +1,3 @@ -#standardSQL # Form controls with placeholder but no label SELECT diff --git a/sql/2025/accessibility/sites_using_role.sql b/sql/2025/accessibility/sites_using_role.sql index bfbb331f233..b58b3503b63 100644 --- a/sql/2025/accessibility/sites_using_role.sql +++ b/sql/2025/accessibility/sites_using_role.sql @@ -1,4 +1,3 @@ -#standardSQL # Sites using the role attribute SELECT diff --git a/sql/2025/accessibility/skip_links.sql b/sql/2025/accessibility/skip_links.sql index b4246157830..cb36b998cb7 100644 --- a/sql/2025/accessibility/skip_links.sql +++ b/sql/2025/accessibility/skip_links.sql @@ -1,4 +1,3 @@ -#standardSQL # % of pages having skip links SELECT diff --git a/sql/2025/accessibility/sr_only_classes.sql b/sql/2025/accessibility/sr_only_classes.sql index 184bacda067..d8e0c5a0f61 100644 --- a/sql/2025/accessibility/sr_only_classes.sql +++ b/sql/2025/accessibility/sr_only_classes.sql @@ -1,4 +1,3 @@ -#standardSQL # Sites using sr-only or visually-hidden classes SELECT diff --git a/sql/2025/accessibility/tabindex_usage_and_values.sql b/sql/2025/accessibility/tabindex_usage_and_values.sql index 3ac32493a32..4ffd0e6f560 100644 --- a/sql/2025/accessibility/tabindex_usage_and_values.sql +++ b/sql/2025/accessibility/tabindex_usage_and_values.sql @@ -1,4 +1,3 @@ -#standardSQL # Positive tabindex value occurrences CREATE TEMPORARY FUNCTION getTotalPositiveTabIndexes(nodes_09_27 JSON) diff --git a/sql/2025/accessibility/table_stats.sql b/sql/2025/accessibility/table_stats.sql index 31ee26f3346..6c2dfe42e10 100644 --- a/sql/2025/accessibility/table_stats.sql +++ b/sql/2025/accessibility/table_stats.sql @@ -1,4 +1,3 @@ -#standardSQL # Table stats. Total all, captioned and presentational SELECT diff --git a/sql/2025/accessibility/units_properties.sql b/sql/2025/accessibility/units_properties.sql index f376fc667d2..92993769613 100644 --- a/sql/2025/accessibility/units_properties.sql +++ b/sql/2025/accessibility/units_properties.sql @@ -1,4 +1,3 @@ -#standardSQL CREATE TEMPORARY FUNCTION getPropertyUnits(css JSON) RETURNS ARRAY> diff --git a/sql/2025/accessibility/valid_html_lang.sql b/sql/2025/accessibility/valid_html_lang.sql index 2890cc58fbe..e364d6fbd88 100644 --- a/sql/2025/accessibility/valid_html_lang.sql +++ b/sql/2025/accessibility/valid_html_lang.sql @@ -1,4 +1,3 @@ -#standardSQL # % of pages with a valid html lang attribute SELECT diff --git a/sql/2025/accessibility/video_track_usage.sql b/sql/2025/accessibility/video_track_usage.sql index 257dac9b4d5..1fe1963812e 100644 --- a/sql/2025/accessibility/video_track_usage.sql +++ b/sql/2025/accessibility/video_track_usage.sql @@ -1,4 +1,3 @@ -#standardSQL # Video elements track usage SELECT diff --git a/sql/2025/accessibility/viewport_zoom_scale.sql b/sql/2025/accessibility/viewport_zoom_scale.sql index 17ffb20a1ee..2c591be4f34 100644 --- a/sql/2025/accessibility/viewport_zoom_scale.sql +++ b/sql/2025/accessibility/viewport_zoom_scale.sql @@ -1,4 +1,3 @@ -#standardSQL # Disabled zooming and scaling via the viewport tag -- custom_metrics.other.meta_viewport is blank so use the almanac one instead diff --git a/sql/2025/accessibility/viewport_zoom_scale_by_domain_rank.sql b/sql/2025/accessibility/viewport_zoom_scale_by_domain_rank.sql index cb7e968f0a5..04db0f8510a 100644 --- a/sql/2025/accessibility/viewport_zoom_scale_by_domain_rank.sql +++ b/sql/2025/accessibility/viewport_zoom_scale_by_domain_rank.sql @@ -1,4 +1,3 @@ -#standardSQL # Disabled zooming and scaling via the viewport tag -- custom_metrics.other.meta_viewport is blank so use the almanac one instead diff --git a/sql/2025/capabilities/fugu.sql b/sql/2025/capabilities/fugu.sql index a11284c8ff5..ba738d2bf9a 100644 --- a/sql/2025/capabilities/fugu.sql +++ b/sql/2025/capabilities/fugu.sql @@ -1,4 +1,3 @@ -#standardSQL SELECT client, fuguAPI, diff --git a/sql/2025/capabilities/top.sql b/sql/2025/capabilities/top.sql index 4bc6483677a..563db8193ef 100644 --- a/sql/2025/capabilities/top.sql +++ b/sql/2025/capabilities/top.sql @@ -1,4 +1,3 @@ -#standardSQL SELECT client, page, diff --git a/sql/2025/cdn/alt_svc_protocol_analysis.sql b/sql/2025/cdn/alt_svc_protocol_analysis.sql index e6c12928600..0ae66dcacdd 100644 --- a/sql/2025/cdn/alt_svc_protocol_analysis.sql +++ b/sql/2025/cdn/alt_svc_protocol_analysis.sql @@ -1,4 +1,3 @@ -#standardSQL # Alt-Svc Protocol Analysis - Deep dive into Alternative Service headers # Analyzes what protocols are advertised vs actually used diff --git a/sql/2025/cdn/brotli_compression_adoption.sql b/sql/2025/cdn/brotli_compression_adoption.sql index c7f502603cb..272a4b0485e 100644 --- a/sql/2025/cdn/brotli_compression_adoption.sql +++ b/sql/2025/cdn/brotli_compression_adoption.sql @@ -1,4 +1,3 @@ -#standardSQL # 20_brotli_compression_adoption.sql: Brotli and modern compression adoption by CDN # Analyzes compression algorithm usage patterns and efficiency across CDN providers # diff --git a/sql/2025/cdn/cache_control_analysis.sql b/sql/2025/cdn/cache_control_analysis.sql index cbd663a9fa4..37be1d70a89 100644 --- a/sql/2025/cdn/cache_control_analysis.sql +++ b/sql/2025/cdn/cache_control_analysis.sql @@ -1,4 +1,3 @@ -#standardSQL # Cache-Control and CDN caching behavior analysis # Analyzes cache directives and actual caching behavior diff --git a/sql/2025/cdn/cdn_security_features_adoption.sql b/sql/2025/cdn/cdn_security_features_adoption.sql index e539be1a202..039baa0824e 100644 --- a/sql/2025/cdn/cdn_security_features_adoption.sql +++ b/sql/2025/cdn/cdn_security_features_adoption.sql @@ -1,4 +1,3 @@ -#standardSQL # 17_cdn_security_features_adoption.sql: CDN Security Features Adoption # # Rationale: Security is a crucial aspect of content delivery. This query analyzes diff --git a/sql/2025/cdn/cdn_usage_by_site_rank.sql b/sql/2025/cdn/cdn_usage_by_site_rank.sql index bcf36fbe914..b764a1e025c 100644 --- a/sql/2025/cdn/cdn_usage_by_site_rank.sql +++ b/sql/2025/cdn/cdn_usage_by_site_rank.sql @@ -1,4 +1,3 @@ -#standardSQL # cdn_usage_by_site_rank.sql : Distribution of HTML pages served by CDN vs Origin by rank WITH requests AS ( diff --git a/sql/2025/cdn/client_hints/baseline.sql b/sql/2025/cdn/client_hints/baseline.sql index 3ce61f11ae6..3467f1cff00 100644 --- a/sql/2025/cdn/client_hints/baseline.sql +++ b/sql/2025/cdn/client_hints/baseline.sql @@ -1,4 +1,3 @@ -#standardSQL -- Baseline Client Hints adoption metrics for context -- Measures both server-side (Accept-CH) and client-side (Sec-CH-*) adoption DECLARE d DATE DEFAULT '2025-07-01'; diff --git a/sql/2025/cdn/client_hints/client_hints_by_cdn.sql b/sql/2025/cdn/client_hints/client_hints_by_cdn.sql index c386173d9e4..8ea3e7374ba 100644 --- a/sql/2025/cdn/client_hints/client_hints_by_cdn.sql +++ b/sql/2025/cdn/client_hints/client_hints_by_cdn.sql @@ -1,4 +1,3 @@ -#standardSQL -- Analyze Client Hints usage by specific CDN provider DECLARE d DATE DEFAULT '2025-07-01'; diff --git a/sql/2025/cdn/client_hints/client_hints_by_header.sql b/sql/2025/cdn/client_hints/client_hints_by_header.sql index 5e43fd570f0..d7f643fd9fc 100644 --- a/sql/2025/cdn/client_hints/client_hints_by_header.sql +++ b/sql/2025/cdn/client_hints/client_hints_by_header.sql @@ -1,4 +1,3 @@ -#standardSQL DECLARE d DATE DEFAULT '2025-07-01'; WITH diff --git a/sql/2025/cdn/client_hints/client_hints_cdn_vs_origin.sql b/sql/2025/cdn/client_hints/client_hints_cdn_vs_origin.sql index b7f00906d33..744894841d0 100644 --- a/sql/2025/cdn/client_hints/client_hints_cdn_vs_origin.sql +++ b/sql/2025/cdn/client_hints/client_hints_cdn_vs_origin.sql @@ -1,4 +1,3 @@ -#standardSQL -- Compare Client Hints adoption between CDN and origin requests DECLARE d DATE DEFAULT '2025-07-01'; diff --git a/sql/2025/cdn/client_hints/default_vs_requested_hints.sql b/sql/2025/cdn/client_hints/default_vs_requested_hints.sql index d5a2c88f736..7ecfd93a58b 100644 --- a/sql/2025/cdn/client_hints/default_vs_requested_hints.sql +++ b/sql/2025/cdn/client_hints/default_vs_requested_hints.sql @@ -1,4 +1,3 @@ -#standardSQL -- Analyze which Client Hints are sent by default vs. those requiring Accept-CH -- Compares hint usage on pages WITH and WITHOUT Accept-CH header DECLARE d DATE DEFAULT '2025-07-01'; diff --git a/sql/2025/cdn/distribution_of_compression_types_by_cdn.sql b/sql/2025/cdn/distribution_of_compression_types_by_cdn.sql index 03f34859cf9..a857daecb79 100644 --- a/sql/2025/cdn/distribution_of_compression_types_by_cdn.sql +++ b/sql/2025/cdn/distribution_of_compression_types_by_cdn.sql @@ -1,4 +1,3 @@ -#standardSQL # distribution_of_compression_types_by_cdn.sql : What compression formats are being used (gzip, brotli, etc) for compressed resources served by CDNs SELECT diff --git a/sql/2025/cdn/distribution_of_compression_types_cdn_vs_origin.sql b/sql/2025/cdn/distribution_of_compression_types_cdn_vs_origin.sql index aaa8b1c8c41..e007d5c57f7 100644 --- a/sql/2025/cdn/distribution_of_compression_types_cdn_vs_origin.sql +++ b/sql/2025/cdn/distribution_of_compression_types_cdn_vs_origin.sql @@ -1,4 +1,3 @@ -#standardSQL # distribution_of_compression_types_cdn_vs_origin.sql : What compression formats are being used (gzip, brotli, etc) for compressed resources served by CDNs SELECT diff --git a/sql/2025/cdn/distribution_of_http_versions.sql b/sql/2025/cdn/distribution_of_http_versions.sql index 33dbda47d2c..7b638ff7692 100644 --- a/sql/2025/cdn/distribution_of_http_versions.sql +++ b/sql/2025/cdn/distribution_of_http_versions.sql @@ -1,4 +1,3 @@ -#standardSQL # distribution_of_http_versions: Percentage of HTTPS responses by protocol SELECT a.client, diff --git a/sql/2025/cdn/distribution_of_http_versions_cdn_vs_origin.sql b/sql/2025/cdn/distribution_of_http_versions_cdn_vs_origin.sql index 21fd8ebd26d..df0e2423cfa 100644 --- a/sql/2025/cdn/distribution_of_http_versions_cdn_vs_origin.sql +++ b/sql/2025/cdn/distribution_of_http_versions_cdn_vs_origin.sql @@ -1,4 +1,3 @@ -#standardSQL # distribution_of_http_versions_cdn_vs_origin.sql 17_19: Percentage of HTTPS responses by protocol SELECT a.client, diff --git a/sql/2025/cdn/distribution_of_tls_time_by_cdn.sql b/sql/2025/cdn/distribution_of_tls_time_by_cdn.sql index 1884bab3abc..1ef629142f4 100644 --- a/sql/2025/cdn/distribution_of_tls_time_by_cdn.sql +++ b/sql/2025/cdn/distribution_of_tls_time_by_cdn.sql @@ -1,4 +1,3 @@ -#standardSQL # distribution_of_tls_time_by_cdn.sql : Distribution of TLS negotiation time by CDN SELECT client, diff --git a/sql/2025/cdn/distribution_of_tls_time_cdn_vs_origin.sql b/sql/2025/cdn/distribution_of_tls_time_cdn_vs_origin.sql index e2baf7172f1..3c8c15f23db 100644 --- a/sql/2025/cdn/distribution_of_tls_time_cdn_vs_origin.sql +++ b/sql/2025/cdn/distribution_of_tls_time_cdn_vs_origin.sql @@ -1,4 +1,3 @@ -#standardSQL # distribution_of_tls_time_cdn_vs_origin.sql : Distribution of TLS negotiation for CDN vs Origin (ie, no CDN) SELECT client, diff --git a/sql/2025/cdn/distribution_of_tls_versions.sql b/sql/2025/cdn/distribution_of_tls_versions.sql index d5d0e8cd2b5..93f1747bcac 100644 --- a/sql/2025/cdn/distribution_of_tls_versions.sql +++ b/sql/2025/cdn/distribution_of_tls_versions.sql @@ -1,4 +1,3 @@ -#standardSQL # distribution_of_tls_versions: Percentage of HTTPS responses by TLS Version and CDN SELECT a.client, diff --git a/sql/2025/cdn/distribution_of_tls_versions_cdn_vs_origin.sql b/sql/2025/cdn/distribution_of_tls_versions_cdn_vs_origin.sql index 51f33b1a5fa..4f11327ed7b 100644 --- a/sql/2025/cdn/distribution_of_tls_versions_cdn_vs_origin.sql +++ b/sql/2025/cdn/distribution_of_tls_versions_cdn_vs_origin.sql @@ -1,4 +1,3 @@ -#standardSQL # distribution_of_tls_versions_cdn_vs_origin: Percentage of HTTPS responses by TLS Version with and without CDN SELECT a.client, diff --git a/sql/2025/cdn/early_hints/baseline.sql b/sql/2025/cdn/early_hints/baseline.sql index 12860b026cf..8142704b651 100644 --- a/sql/2025/cdn/early_hints/baseline.sql +++ b/sql/2025/cdn/early_hints/baseline.sql @@ -1,4 +1,3 @@ -#standardSQL -- Baseline Early Hints (HTTP 103) adoption metrics -- Measures overall adoption of Early Hints responses DECLARE d DATE DEFAULT '2025-07-01'; diff --git a/sql/2025/cdn/early_hints/early_hints_by_cdn.sql b/sql/2025/cdn/early_hints/early_hints_by_cdn.sql index e1327da72b2..f9f5087206b 100644 --- a/sql/2025/cdn/early_hints/early_hints_by_cdn.sql +++ b/sql/2025/cdn/early_hints/early_hints_by_cdn.sql @@ -1,4 +1,3 @@ -#standardSQL -- Analyze Early Hints usage by specific CDN provider DECLARE d DATE DEFAULT '2025-07-01'; diff --git a/sql/2025/cdn/early_hints/early_hints_cdn_vs_origin.sql b/sql/2025/cdn/early_hints/early_hints_cdn_vs_origin.sql index 31495aa1e48..3ee1bd9c7d6 100644 --- a/sql/2025/cdn/early_hints/early_hints_cdn_vs_origin.sql +++ b/sql/2025/cdn/early_hints/early_hints_cdn_vs_origin.sql @@ -1,4 +1,3 @@ -#standardSQL -- Compare Early Hints adoption between CDN and origin requests DECLARE d DATE DEFAULT '2025-07-01'; diff --git a/sql/2025/cdn/early_hints/preload_patterns.sql b/sql/2025/cdn/early_hints/preload_patterns.sql index 71c30068427..fe3cfd47b62 100644 --- a/sql/2025/cdn/early_hints/preload_patterns.sql +++ b/sql/2025/cdn/early_hints/preload_patterns.sql @@ -1,4 +1,3 @@ -#standardSQL -- Analyze common preload patterns in Early Hints -- Shows how many resources are typically preloaded and common combinations DECLARE d DATE DEFAULT '2025-07-01'; diff --git a/sql/2025/cdn/early_hints/resource_types_preloaded.sql b/sql/2025/cdn/early_hints/resource_types_preloaded.sql index d5e83517bf7..08dcb3c22cb 100644 --- a/sql/2025/cdn/early_hints/resource_types_preloaded.sql +++ b/sql/2025/cdn/early_hints/resource_types_preloaded.sql @@ -1,4 +1,3 @@ -#standardSQL -- Analyze which resource types are being preloaded via Early Hints -- Shows what types of resources (scripts, styles, fonts, etc.) are prioritized DECLARE d DATE DEFAULT '2025-07-01'; diff --git a/sql/2025/cdn/h3_adoption_by_cdn_provider.sql b/sql/2025/cdn/h3_adoption_by_cdn_provider.sql index e38b8a263bf..92929aa157d 100644 --- a/sql/2025/cdn/h3_adoption_by_cdn_provider.sql +++ b/sql/2025/cdn/h3_adoption_by_cdn_provider.sql @@ -1,4 +1,3 @@ -#standardSQL # h3_adoption_by_cdn_provider_FINAL_v2.sql: HTTP/3 adoption rates by CDN provider # Simplified version without unnecessary isSecure field to avoid casting issues diff --git a/sql/2025/cdn/h3_adoption_by_cdn_vs_origin.sql b/sql/2025/cdn/h3_adoption_by_cdn_vs_origin.sql index cebdf6f56f2..81471dc9c3a 100644 --- a/sql/2025/cdn/h3_adoption_by_cdn_vs_origin.sql +++ b/sql/2025/cdn/h3_adoption_by_cdn_vs_origin.sql @@ -1,4 +1,3 @@ -#standardSQL # h3_adoption_by_cdn_provider_FINAL_v2.sql: HTTP/3 adoption rates by CDN provider # Simplified version without unnecessary isSecure field to avoid casting issues diff --git a/sql/2025/cdn/http3_performance_impact.sql b/sql/2025/cdn/http3_performance_impact.sql index b29eec3f2ca..818744fb918 100644 --- a/sql/2025/cdn/http3_performance_impact.sql +++ b/sql/2025/cdn/http3_performance_impact.sql @@ -1,4 +1,3 @@ -#standardSQL # 33_http3_performance_impact.sql # Comprehensive analysis of HTTP/3 performance impact vs HTTP/2 # Measures real-world performance differences between protocols diff --git a/sql/2025/cdn/security_headers_by_cdn.sql b/sql/2025/cdn/security_headers_by_cdn.sql index 3cf82e7f28f..45b4eab5a9a 100644 --- a/sql/2025/cdn/security_headers_by_cdn.sql +++ b/sql/2025/cdn/security_headers_by_cdn.sql @@ -1,4 +1,3 @@ -#standardSQL # Security headers adoption by CDN vs Origin # Analyzes adoption of key security headers across CDN providers diff --git a/sql/2025/cdn/server_timing_adoption.sql b/sql/2025/cdn/server_timing_adoption.sql index 32bd389cf37..64ba61ba554 100644 --- a/sql/2025/cdn/server_timing_adoption.sql +++ b/sql/2025/cdn/server_timing_adoption.sql @@ -1,4 +1,3 @@ -#standardSQL # 32_server_timing_adoption.sql # Deep dive into Server-Timing header usage across CDNs # Server-Timing provides transparency into server-side performance metrics diff --git a/sql/2025/cdn/top_cdns.sql b/sql/2025/cdn/top_cdns.sql index 574ca9d80fe..0cc69ae72c4 100644 --- a/sql/2025/cdn/top_cdns.sql +++ b/sql/2025/cdn/top_cdns.sql @@ -1,4 +1,3 @@ -#standardSQL # top_cdns.sql: Top CDNs used SELECT year, diff --git a/sql/2025/cdn/top_cdns_by_rank.sql b/sql/2025/cdn/top_cdns_by_rank.sql index c5cae0f7cdb..d44992b52de 100644 --- a/sql/2025/cdn/top_cdns_by_rank.sql +++ b/sql/2025/cdn/top_cdns_by_rank.sql @@ -1,4 +1,3 @@ -#standardSQL # top_cdns_by_rank.sql: Top CDNs used on the root HTML pages by CrUX rank WITH requests AS ( diff --git a/sql/2025/cdn/usage_of_content_cdns.sql b/sql/2025/cdn/usage_of_content_cdns.sql index be44b77ba80..4f15a7fd55f 100644 --- a/sql/2025/cdn/usage_of_content_cdns.sql +++ b/sql/2025/cdn/usage_of_content_cdns.sql @@ -1,4 +1,3 @@ -#standardSQL # usage_ofcontent_cdns.sql: % of Pages using a library CDN Host SELECT diff --git a/sql/2025/cms/cms_adoption.sql b/sql/2025/cms/cms_adoption.sql index 4f2a70b8620..d5e4aa17c11 100644 --- a/sql/2025/cms/cms_adoption.sql +++ b/sql/2025/cms/cms_adoption.sql @@ -1,4 +1,3 @@ -#standardSQL # CMS adoption OVER time # cms_adoption.sql diff --git a/sql/2025/cms/cms_adoption_by_geo.sql b/sql/2025/cms/cms_adoption_by_geo.sql index 2415f6fdcc8..b817efc85ad 100644 --- a/sql/2025/cms/cms_adoption_by_geo.sql +++ b/sql/2025/cms/cms_adoption_by_geo.sql @@ -1,4 +1,3 @@ -#standardSQL # All CMS popularity per geo # cms_adoption_by_geo.sql diff --git a/sql/2025/cms/cms_adoption_by_rank_all.sql b/sql/2025/cms/cms_adoption_by_rank_all.sql index a217a8842f5..b4804240a76 100644 --- a/sql/2025/cms/cms_adoption_by_rank_all.sql +++ b/sql/2025/cms/cms_adoption_by_rank_all.sql @@ -1,4 +1,3 @@ -#standardSQL # CMS adoption per rank SELECT client, diff --git a/sql/2025/cms/cms_adoption_by_region.sql b/sql/2025/cms/cms_adoption_by_region.sql index 3816fc5b070..a5d4a3254a4 100644 --- a/sql/2025/cms/cms_adoption_by_region.sql +++ b/sql/2025/cms/cms_adoption_by_region.sql @@ -1,4 +1,3 @@ -#standardSQL # ALL CMS popularity per geo CREATE TEMP FUNCTION GET_GEO(country_code STRING, geo STRING) RETURNS STRING diff --git a/sql/2025/cms/cms_adoption_by_subregion.sql b/sql/2025/cms/cms_adoption_by_subregion.sql index 22e8b922248..fdea8fe455c 100644 --- a/sql/2025/cms/cms_adoption_by_subregion.sql +++ b/sql/2025/cms/cms_adoption_by_subregion.sql @@ -1,4 +1,3 @@ -#standardSQL # All CMS popularity per geo CREATE TEMP FUNCTION GET_GEO(country_code STRING, geo STRING) RETURNS STRING LANGUAGE js AS ''' var countries = { diff --git a/sql/2025/cms/image_format_popularity.sql b/sql/2025/cms/image_format_popularity.sql index 683f74e465c..d4e44a5f4b9 100644 --- a/sql/2025/cms/image_format_popularity.sql +++ b/sql/2025/cms/image_format_popularity.sql @@ -1,4 +1,3 @@ -#standardSQL # Image format popularity BY CMS # image_format_popularity.sql diff --git a/sql/2025/cms/lighthouse_category_scores_per_cms.sql b/sql/2025/cms/lighthouse_category_scores_per_cms.sql index aec263c9789..e584bb7b680 100644 --- a/sql/2025/cms/lighthouse_category_scores_per_cms.sql +++ b/sql/2025/cms/lighthouse_category_scores_per_cms.sql @@ -1,4 +1,3 @@ -#standardSQL # Lighthouse category scores per CMS # lighthouse_category_scores_per_cms.sql SELECT diff --git a/sql/2025/cms/lighthouse_category_scores_per_cms_yoy.sql b/sql/2025/cms/lighthouse_category_scores_per_cms_yoy.sql index f2578ea3426..3e19feb88ef 100644 --- a/sql/2025/cms/lighthouse_category_scores_per_cms_yoy.sql +++ b/sql/2025/cms/lighthouse_category_scores_per_cms_yoy.sql @@ -1,4 +1,3 @@ -#standardSQL # Lighthouse category scores per CMS YoY # lighthouse_category_scores_per_cms_yoy.sql SELECT diff --git a/sql/2025/cms/page_weight_distribution.sql b/sql/2025/cms/page_weight_distribution.sql index c25b4f1be94..17bf1e3ed1f 100644 --- a/sql/2025/cms/page_weight_distribution.sql +++ b/sql/2025/cms/page_weight_distribution.sql @@ -1,4 +1,3 @@ -#standardSQL # Total page weight distribution BY CMS # page_weight_distribution.sql SELECT diff --git a/sql/2025/cms/resource_weights.sql b/sql/2025/cms/resource_weights.sql index 91a8783f6eb..a1b058e8cce 100644 --- a/sql/2025/cms/resource_weights.sql +++ b/sql/2025/cms/resource_weights.sql @@ -1,4 +1,3 @@ -#standardSQL # Median resource weights by CMS #resource_weights.sql diff --git a/sql/2025/cms/top_cms.sql b/sql/2025/cms/top_cms.sql index 4d01da5c375..95f0b860618 100644 --- a/sql/2025/cms/top_cms.sql +++ b/sql/2025/cms/top_cms.sql @@ -1,4 +1,3 @@ -#standardSQL # Top CMS platforms, compared to 2020 # top_cms.sql SELECT diff --git a/sql/2025/cms/top_cms_by_geo.sql b/sql/2025/cms/top_cms_by_geo.sql index 8df15b31dc3..4e3c32fecf2 100644 --- a/sql/2025/cms/top_cms_by_geo.sql +++ b/sql/2025/cms/top_cms_by_geo.sql @@ -1,4 +1,3 @@ -#standardSQL # CMS popularity per geo # top_cms_by_geo.sql WITH geo_summary AS ( diff --git a/sql/2025/cms/top_cms_by_rank.sql b/sql/2025/cms/top_cms_by_rank.sql index f1c878b3cbe..0d9f55a9a6f 100644 --- a/sql/2025/cms/top_cms_by_rank.sql +++ b/sql/2025/cms/top_cms_by_rank.sql @@ -1,4 +1,3 @@ -#standardSQL # CMS adoption per rank # top_cms_by_rank.sql diff --git a/sql/2025/cms/wordpress_page_builders.sql b/sql/2025/cms/wordpress_page_builders.sql index 3babe38be59..2f91079baaf 100644 --- a/sql/2025/cms/wordpress_page_builders.sql +++ b/sql/2025/cms/wordpress_page_builders.sql @@ -1,4 +1,3 @@ -#standardSQL # Top WordPress page builder combinations # wordpress_page_builders.sql diff --git a/sql/2025/cms/wordpress_resources.sql b/sql/2025/cms/wordpress_resources.sql index a314eb48955..a6db35af5c8 100644 --- a/sql/2025/cms/wordpress_resources.sql +++ b/sql/2025/cms/wordpress_resources.sql @@ -1,4 +1,3 @@ -#standardSQL # Distribution OF WordPress resource types BY path # wordpress_resources.sql # Updated to use the new crawl dataset diff --git a/sql/2025/generative-ai/ai_tld.sql b/sql/2025/generative-ai/ai_tld.sql index 1e8bc361f2e..493bb8f29d3 100644 --- a/sql/2025/generative-ai/ai_tld.sql +++ b/sql/2025/generative-ai/ai_tld.sql @@ -1,4 +1,3 @@ -#standardSQL # .ai domains per exclusive rank bucket, 2022 vs 2025 WITH base AS ( diff --git a/sql/2025/generative-ai/gradient-client-rank.sql b/sql/2025/generative-ai/gradient-client-rank.sql index 2fef111cb66..0841ff243b8 100644 --- a/sql/2025/generative-ai/gradient-client-rank.sql +++ b/sql/2025/generative-ai/gradient-client-rank.sql @@ -1,8 +1,6 @@ -#standardSQL -- Adoption of CSS gradients in custom_metrics.css_variables -- Grouped by: year, client, rank bucket -#standardSQL -- Adoption of CSS gradients in custom_metrics.css_variables -- Grouped by: year, client, rank bucket diff --git a/sql/2025/generative-ai/gradient-use.sql b/sql/2025/generative-ai/gradient-use.sql index bc78df224db..21f98456c93 100644 --- a/sql/2025/generative-ai/gradient-use.sql +++ b/sql/2025/generative-ai/gradient-use.sql @@ -1,4 +1,3 @@ -#standardSQL -- % of sites whose CSS variables include a gradient( ... ) per year, client, rank -- Goal it use is as an indicator for vibe coded website like "delve into" is used for papers SELECT diff --git a/sql/2025/generative-ai/gradient.sql b/sql/2025/generative-ai/gradient.sql index b4273c78c2c..6aae42e89ed 100644 --- a/sql/2025/generative-ai/gradient.sql +++ b/sql/2025/generative-ai/gradient.sql @@ -1,4 +1,3 @@ -#standardSQL WITH raw_data AS ( SELECT date, diff --git a/sql/2025/generative-ai/sites-with-robot-txt.sql b/sql/2025/generative-ai/sites-with-robot-txt.sql index 2d74dff6a24..889710b91b4 100644 --- a/sql/2025/generative-ai/sites-with-robot-txt.sql +++ b/sql/2025/generative-ai/sites-with-robot-txt.sql @@ -1,4 +1,3 @@ -#standardSQL -- % of sites whose robots.txt returns 200 and includes any directive, therefor the percentage is smaller (75% instead of 95% reported elswhere) WITH roots AS ( SELECT diff --git a/sql/2025/generative-ai/user-agent-named.sql b/sql/2025/generative-ai/user-agent-named.sql index 51f7309dc2e..b85daec43f5 100644 --- a/sql/2025/generative-ai/user-agent-named.sql +++ b/sql/2025/generative-ai/user-agent-named.sql @@ -1,4 +1,3 @@ -#standardSQL # Percent of sites with a given user-agent mentioned in robots.txt, by rank bucket # Returns percentages among (a) all sites and (b) only sites with robots.txt status=200. diff --git a/sql/2025/generative-ai/user-agent-years.sql b/sql/2025/generative-ai/user-agent-years.sql index d8d318ae296..a9b25927fe1 100644 --- a/sql/2025/generative-ai/user-agent-years.sql +++ b/sql/2025/generative-ai/user-agent-years.sql @@ -1,4 +1,3 @@ -#standardSQL -- Percent of sites mentioning each user-agent in robots.txt, over fixed Almanac snapshots CREATE TEMP FUNCTION getByAgent(byua_json JSON, agent STRING) diff --git a/sql/2025/generative-ai/vibecodetools.sql b/sql/2025/generative-ai/vibecodetools.sql index 52a890e34f9..bc19c898b72 100644 --- a/sql/2025/generative-ai/vibecodetools.sql +++ b/sql/2025/generative-ai/vibecodetools.sql @@ -1,4 +1,3 @@ -#standardSQL WITH base AS ( SELECT date, diff --git a/sql/2025/performance/early_hints_usage_rank.sql b/sql/2025/performance/early_hints_usage_rank.sql index 294746758eb..7d8e5f6baca 100644 --- a/sql/2025/performance/early_hints_usage_rank.sql +++ b/sql/2025/performance/early_hints_usage_rank.sql @@ -1,4 +1,3 @@ -#standardSQL # Early Hints (HTTP 103) usage by site rank # Measures the percentage of sites using early hints at different popularity ranks diff --git a/sql/2025/performance/early_hints_usage_trends.sql b/sql/2025/performance/early_hints_usage_trends.sql index 90779bd9e0c..479d44249dd 100644 --- a/sql/2025/performance/early_hints_usage_trends.sql +++ b/sql/2025/performance/early_hints_usage_trends.sql @@ -1,4 +1,3 @@ -#standardSQL # Early Hints (HTTP 103) adoption trend over time # Shows usage by client (mobile, desktop) across years diff --git a/sql/2025/performance/generated_content.sql b/sql/2025/performance/generated_content.sql index 5050bdd09c4..27054ea24b3 100644 --- a/sql/2025/performance/generated_content.sql +++ b/sql/2025/performance/generated_content.sql @@ -1,4 +1,3 @@ -#standardSQL CREATE TEMPORARY FUNCTION getGeneratedContent(generatedContent JSON) RETURNS STRUCT LANGUAGE js AS ''' try { diff --git a/sql/2025/performance/generated_content_web_vitals.sql b/sql/2025/performance/generated_content_web_vitals.sql index 76c4d9dd7a3..d4fee1fa950 100644 --- a/sql/2025/performance/generated_content_web_vitals.sql +++ b/sql/2025/performance/generated_content_web_vitals.sql @@ -1,4 +1,3 @@ -#standardSQL CREATE TEMP FUNCTION IS_NON_ZERO(good FLOAT64, needs_improvement FLOAT64, poor FLOAT64) RETURNS BOOL AS ( good + needs_improvement + poor > 0 ); diff --git a/sql/2025/pwa/assetlink_usage.sql b/sql/2025/pwa/assetlink_usage.sql index 4cd80fea436..42782db795f 100644 --- a/sql/2025/pwa/assetlink_usage.sql +++ b/sql/2025/pwa/assetlink_usage.sql @@ -1,4 +1,3 @@ -#standardSQL # assetlink usage SELECT diff --git a/sql/2025/pwa/fugu.sql b/sql/2025/pwa/fugu.sql index d13f02111f8..8911c1ede29 100644 --- a/sql/2025/pwa/fugu.sql +++ b/sql/2025/pwa/fugu.sql @@ -1,4 +1,3 @@ -#standardSQL CREATE TEMP FUNCTION getFuguAPIsFromOther(other_json STRING) RETURNS ARRAY LANGUAGE js AS ''' diff --git a/sql/2025/pwa/manifest_categories.sql b/sql/2025/pwa/manifest_categories.sql index 37b16c3652a..612323d6163 100644 --- a/sql/2025/pwa/manifest_categories.sql +++ b/sql/2025/pwa/manifest_categories.sql @@ -1,4 +1,3 @@ -#standardSQL # Top manifest categories CREATE TEMPORARY FUNCTION getCategories(manifest JSON) RETURNS ARRAY LANGUAGE js AS ''' diff --git a/sql/2025/pwa/manifest_display_values.sql b/sql/2025/pwa/manifest_display_values.sql index 66348f5d619..84ba97f9b0e 100644 --- a/sql/2025/pwa/manifest_display_values.sql +++ b/sql/2025/pwa/manifest_display_values.sql @@ -1,4 +1,3 @@ -#standardSQL # Top most used display values in manifest files CREATE TEMP FUNCTION getDisplay(manifest JSON) RETURNS STRING LANGUAGE js AS ''' diff --git a/sql/2025/pwa/manifest_icon_sizes.sql b/sql/2025/pwa/manifest_icon_sizes.sql index d3333370df5..66d7f48bfe8 100644 --- a/sql/2025/pwa/manifest_icon_sizes.sql +++ b/sql/2025/pwa/manifest_icon_sizes.sql @@ -1,4 +1,3 @@ -#standardSQL # Top manifest icon sizes CREATE TEMPORARY FUNCTION getIconSizes(manifest JSON) RETURNS ARRAY LANGUAGE js AS ''' diff --git a/sql/2025/pwa/manifest_orientations.sql b/sql/2025/pwa/manifest_orientations.sql index 8d828cd0e82..659103c65f2 100644 --- a/sql/2025/pwa/manifest_orientations.sql +++ b/sql/2025/pwa/manifest_orientations.sql @@ -1,4 +1,3 @@ -#standardSQL # Top manifest orientations CREATE TEMP FUNCTION getOrientation(manifest JSON) RETURNS STRING LANGUAGE js AS ''' diff --git a/sql/2025/pwa/manifest_properties.sql b/sql/2025/pwa/manifest_properties.sql index 5c27d6ed692..e34e2d9dc01 100644 --- a/sql/2025/pwa/manifest_properties.sql +++ b/sql/2025/pwa/manifest_properties.sql @@ -1,4 +1,3 @@ -#standardSQL # Top manifest properties CREATE TEMP FUNCTION getManifestProps(manifest JSON) diff --git a/sql/2025/pwa/manifests_and_service_workers.sql b/sql/2025/pwa/manifests_and_service_workers.sql index 17a1d8f14c4..f57247e1c18 100644 --- a/sql/2025/pwa/manifests_and_service_workers.sql +++ b/sql/2025/pwa/manifests_and_service_workers.sql @@ -1,4 +1,3 @@ -#standardSQL # Counting Manifests and Service Workers SELECT client, diff --git a/sql/2025/pwa/manifests_description.sql b/sql/2025/pwa/manifests_description.sql index 5638bdf4d79..cb37bbf489d 100644 --- a/sql/2025/pwa/manifests_description.sql +++ b/sql/2025/pwa/manifests_description.sql @@ -1,4 +1,3 @@ -#standardSQL # % manifests with description for service worker pages and all pages CREATE TEMP FUNCTION hasDescription(manifest JSON) diff --git a/sql/2025/pwa/manifests_file_handlers.sql b/sql/2025/pwa/manifests_file_handlers.sql index 09b634c5933..715d082976e 100644 --- a/sql/2025/pwa/manifests_file_handlers.sql +++ b/sql/2025/pwa/manifests_file_handlers.sql @@ -1,4 +1,3 @@ -#standardSQL # % manifests with file handlers for service worker pages and all pages CREATE TEMP FUNCTION hasFileHandlers(manifest JSON) diff --git a/sql/2025/pwa/manifests_iarc.sql b/sql/2025/pwa/manifests_iarc.sql index 6cfc7c0f946..9d86521b9d4 100644 --- a/sql/2025/pwa/manifests_iarc.sql +++ b/sql/2025/pwa/manifests_iarc.sql @@ -1,4 +1,3 @@ -#standardSQL # % manifests with iarc rating for service worker pages and all pages CREATE TEMP FUNCTION hasIARC(manifest JSON) diff --git a/sql/2025/pwa/manifests_lang.sql b/sql/2025/pwa/manifests_lang.sql index bf0cfb27b95..845955ac090 100644 --- a/sql/2025/pwa/manifests_lang.sql +++ b/sql/2025/pwa/manifests_lang.sql @@ -1,4 +1,3 @@ -#standardSQL # % manifests with language for service worker pages and all pages DECLARE run_date DATE DEFAULT '2025-07-01'; diff --git a/sql/2025/pwa/manifests_not_json_parsable.sql b/sql/2025/pwa/manifests_not_json_parsable.sql index bcdb547aa2d..e8744a3c326 100644 --- a/sql/2025/pwa/manifests_not_json_parsable.sql +++ b/sql/2025/pwa/manifests_not_json_parsable.sql @@ -1,4 +1,3 @@ -#standardSQL # Manifests that are not JSON parsable for service worker pages and all pages CREATE TEMP FUNCTION canParseManifest(manifest JSON) diff --git a/sql/2025/pwa/manifests_note_taking.sql b/sql/2025/pwa/manifests_note_taking.sql index a6832afb699..f91364206e6 100644 --- a/sql/2025/pwa/manifests_note_taking.sql +++ b/sql/2025/pwa/manifests_note_taking.sql @@ -1,4 +1,3 @@ -#standardSQL # % manifests with note taking for service worker pages and all pages CREATE TEMP FUNCTION hasNoteTaking(manifest JSON) diff --git a/sql/2025/pwa/manifests_preferring_native_apps.sql b/sql/2025/pwa/manifests_preferring_native_apps.sql index bf4fd78a2a6..65210fb7354 100644 --- a/sql/2025/pwa/manifests_preferring_native_apps.sql +++ b/sql/2025/pwa/manifests_preferring_native_apps.sql @@ -1,4 +1,3 @@ -#standardSQL # % manifests preferring native apps for service worker pages and all pages CREATE TEMP FUNCTION prefersNative(manifest JSON) diff --git a/sql/2025/pwa/manifests_protocol_handlers.sql b/sql/2025/pwa/manifests_protocol_handlers.sql index d809d75f560..963efc35f63 100644 --- a/sql/2025/pwa/manifests_protocol_handlers.sql +++ b/sql/2025/pwa/manifests_protocol_handlers.sql @@ -1,4 +1,3 @@ -#standardSQL # % manifests with protocol handlers for service worker pages and all pages CREATE TEMP FUNCTION hasProtocolHandlers(manifest JSON) diff --git a/sql/2025/pwa/manifests_screenshots.sql b/sql/2025/pwa/manifests_screenshots.sql index 6b1c10c10a5..9ce9c074340 100644 --- a/sql/2025/pwa/manifests_screenshots.sql +++ b/sql/2025/pwa/manifests_screenshots.sql @@ -1,4 +1,3 @@ -#standardSQL # % manifests with screenshots for service worker pages and all pages CREATE TEMP FUNCTION hasScreenshots(manifest JSON) diff --git a/sql/2025/pwa/manifests_screenshots_platform_narrow.sql b/sql/2025/pwa/manifests_screenshots_platform_narrow.sql index 9e6dca27fbd..f3715b1c611 100644 --- a/sql/2025/pwa/manifests_screenshots_platform_narrow.sql +++ b/sql/2025/pwa/manifests_screenshots_platform_narrow.sql @@ -1,4 +1,3 @@ -#standardSQL # % manifests with narrow platform screenshots for service worker pages and all pages CREATE TEMP FUNCTION hasScreenshotsPlatformNarrow(manifest JSON) diff --git a/sql/2025/pwa/manifests_screenshots_platform_wide.sql b/sql/2025/pwa/manifests_screenshots_platform_wide.sql index ed3260f51c3..d70234c2c9a 100644 --- a/sql/2025/pwa/manifests_screenshots_platform_wide.sql +++ b/sql/2025/pwa/manifests_screenshots_platform_wide.sql @@ -1,4 +1,3 @@ -#standardSQL # % manifests with wide platform screenshots for service worker pages and all pages CREATE TEMP FUNCTION hasScreenshotsPlatformWide(manifest JSON) diff --git a/sql/2025/pwa/manifests_share_target.sql b/sql/2025/pwa/manifests_share_target.sql index bf969d13325..306ca48489d 100644 --- a/sql/2025/pwa/manifests_share_target.sql +++ b/sql/2025/pwa/manifests_share_target.sql @@ -1,4 +1,3 @@ -#standardSQL # % manifests with web share target for service worker pages and all pages CREATE TEMP FUNCTION hasShareTarget(manifest JSON) diff --git a/sql/2025/pwa/manifests_shortcuts.sql b/sql/2025/pwa/manifests_shortcuts.sql index 16f70aef44d..3c4f451120e 100644 --- a/sql/2025/pwa/manifests_shortcuts.sql +++ b/sql/2025/pwa/manifests_shortcuts.sql @@ -1,4 +1,3 @@ -#standardSQL # % manifests with shortcuts for service worker pages and all pages CREATE TEMP FUNCTION hasShortcuts(manifest JSON) diff --git a/sql/2025/pwa/manifests_window_controls_overlay.sql b/sql/2025/pwa/manifests_window_controls_overlay.sql index 8f674e7a9a6..968340d97a0 100644 --- a/sql/2025/pwa/manifests_window_controls_overlay.sql +++ b/sql/2025/pwa/manifests_window_controls_overlay.sql @@ -1,4 +1,3 @@ -#standardSQL # % manifests with window controls overlay display override for service worker pages and all pages CREATE TEMP FUNCTION hasWindowControlsOverlay(manifest JSON) diff --git a/sql/2025/pwa/popular_pwa_libraries.sql b/sql/2025/pwa/popular_pwa_libraries.sql index a672f809301..d8f9cf1837b 100644 --- a/sql/2025/pwa/popular_pwa_libraries.sql +++ b/sql/2025/pwa/popular_pwa_libraries.sql @@ -1,4 +1,3 @@ -#standardSQL # Popular PWA script (2025) — only crawl/custom_metrics updates, logic identical to 2022 CREATE TEMPORARY FUNCTION getSWLibraries(importScriptsInfo STRING) diff --git a/sql/2025/pwa/popular_pwa_libraries_helper.sql b/sql/2025/pwa/popular_pwa_libraries_helper.sql index 18efad558b1..c812bb7a3f5 100644 --- a/sql/2025/pwa/popular_pwa_libraries_helper.sql +++ b/sql/2025/pwa/popular_pwa_libraries_helper.sql @@ -1,4 +1,3 @@ -#standardSQL # Use this to find popular library imports for popular_pwa_libraries.sql (2025) # Only crawl/custom_metrics updates; logic identical to 2022 diff --git a/sql/2025/pwa/pwa_blink_usage.sql b/sql/2025/pwa/pwa_blink_usage.sql index 52a8700eb7f..ffb6f6c036d 100644 --- a/sql/2025/pwa/pwa_blink_usage.sql +++ b/sql/2025/pwa/pwa_blink_usage.sql @@ -1,4 +1,3 @@ -#standardSQL # PWA features tracked in blink_features.usage (2025) # Only dataset/date update; logic identical to 2022 diff --git a/sql/2025/pwa/pwa_notification_acceptance_rates.sql b/sql/2025/pwa/pwa_notification_acceptance_rates.sql index 3ebb3d4efea..a93b45dd40d 100644 --- a/sql/2025/pwa/pwa_notification_acceptance_rates.sql +++ b/sql/2025/pwa/pwa_notification_acceptance_rates.sql @@ -1,4 +1,3 @@ -#standardSQL # Web Push Notification CRUX stats (10/25/50/75/90/100) for PWA origins — 2025 # Only crawl dataset update; logic identical to 2022 diff --git a/sql/2025/pwa/pwa_notification_acceptance_rates_over_time.sql b/sql/2025/pwa/pwa_notification_acceptance_rates_over_time.sql index aba6647853f..a993bb25939 100644 --- a/sql/2025/pwa/pwa_notification_acceptance_rates_over_time.sql +++ b/sql/2025/pwa/pwa_notification_acceptance_rates_over_time.sql @@ -1,4 +1,3 @@ -#standardSQL # Total Notification Acceptance Rates across all origins — 2025 # Unweighted by origin popularity; logic identical to 2022 diff --git a/sql/2025/pwa/sw_adoption_over_time.sql b/sql/2025/pwa/sw_adoption_over_time.sql index fe18501a893..4404963cb54 100644 --- a/sql/2025/pwa/sw_adoption_over_time.sql +++ b/sql/2025/pwa/sw_adoption_over_time.sql @@ -1,4 +1,3 @@ -#standardSQL # SW controlled pages over time (2025) — dataset same, direct from blink_features.usage SELECT DISTINCT diff --git a/sql/2025/pwa/sw_adoption_over_time_ranking.sql b/sql/2025/pwa/sw_adoption_over_time_ranking.sql index 0b3e9ffaeff..8d573375a73 100644 --- a/sql/2025/pwa/sw_adoption_over_time_ranking.sql +++ b/sql/2025/pwa/sw_adoption_over_time_ranking.sql @@ -1,4 +1,3 @@ -#standardSQL # SW controlled pages by rank (2025) SELECT diff --git a/sql/2025/pwa/sw_events.sql b/sql/2025/pwa/sw_events.sql index f0c84a40b69..3caf46bc166 100644 --- a/sql/2025/pwa/sw_events.sql +++ b/sql/2025/pwa/sw_events.sql @@ -1,4 +1,3 @@ -#standardSQL # SW events (2025) — only crawl/custom_metrics updates CREATE TEMPORARY FUNCTION getSWEvents(pwa STRING) diff --git a/sql/2025/pwa/sw_methods.sql b/sql/2025/pwa/sw_methods.sql index 1719324ee00..1b8a1ef0873 100644 --- a/sql/2025/pwa/sw_methods.sql +++ b/sql/2025/pwa/sw_methods.sql @@ -1,4 +1,3 @@ -#standardSQL # SW methods (2025) — only crawl/custom_metrics updates CREATE TEMPORARY FUNCTION getSWMethods(swMethodsInfo STRING) diff --git a/sql/2025/pwa/sw_objects.sql b/sql/2025/pwa/sw_objects.sql index 68d4d6a6bf4..b9184ec357f 100644 --- a/sql/2025/pwa/sw_objects.sql +++ b/sql/2025/pwa/sw_objects.sql @@ -1,4 +1,3 @@ -#standardSQL # SW objects (2025) — only crawl/custom_metrics updates CREATE TEMPORARY FUNCTION getSWObjects(swObjectsInfo STRING) diff --git a/sql/2025/pwa/sw_objects_name_only.sql b/sql/2025/pwa/sw_objects_name_only.sql index dc3747374ba..ee1fbc629ed 100644 --- a/sql/2025/pwa/sw_objects_name_only.sql +++ b/sql/2025/pwa/sw_objects_name_only.sql @@ -1,4 +1,3 @@ -#standardSQL # SW objects (name only) — 2025 CREATE TEMPORARY FUNCTION getSWObjects(swObjectsInfo STRING) diff --git a/sql/2025/pwa/sw_registration_properties.sql b/sql/2025/pwa/sw_registration_properties.sql index c36e256dda4..0fbb264916f 100644 --- a/sql/2025/pwa/sw_registration_properties.sql +++ b/sql/2025/pwa/sw_registration_properties.sql @@ -1,4 +1,3 @@ -#standardSQL # SW registration properties (2025) CREATE TEMPORARY FUNCTION getSWRegistrationProperties(info STRING) diff --git a/sql/2025/pwa/sw_registration_properties_name_only.sql b/sql/2025/pwa/sw_registration_properties_name_only.sql index 4c7e6bc3864..da6a0e84781 100644 --- a/sql/2025/pwa/sw_registration_properties_name_only.sql +++ b/sql/2025/pwa/sw_registration_properties_name_only.sql @@ -1,4 +1,3 @@ -#standardSQL # SW registration properties (name only) — 2025 CREATE TEMPORARY FUNCTION getSWRegistrationProperties(info STRING) diff --git a/sql/2025/pwa/workbox_methods.sql b/sql/2025/pwa/workbox_methods.sql index 21aa60c3708..3a715dd0f5b 100644 --- a/sql/2025/pwa/workbox_methods.sql +++ b/sql/2025/pwa/workbox_methods.sql @@ -1,4 +1,3 @@ -#standardSQL # Workbox methods (2025) CREATE TEMPORARY FUNCTION getWorkboxMethods(workboxInfo STRING) diff --git a/sql/2025/pwa/workbox_packages.sql b/sql/2025/pwa/workbox_packages.sql index f53c7152970..76d89128462 100644 --- a/sql/2025/pwa/workbox_packages.sql +++ b/sql/2025/pwa/workbox_packages.sql @@ -1,4 +1,3 @@ -#standardSQL # Workbox package and methods (2025) CREATE TEMPORARY FUNCTION getWorkboxPackages(workboxInfo STRING) diff --git a/sql/2025/pwa/workbox_usage.sql b/sql/2025/pwa/workbox_usage.sql index 86cc6b8134e..f25807f57ec 100644 --- a/sql/2025/pwa/workbox_usage.sql +++ b/sql/2025/pwa/workbox_usage.sql @@ -1,4 +1,3 @@ -#standardSQL # Workbox usage (2025) SELECT diff --git a/sql/2025/pwa/workbox_versions.sql b/sql/2025/pwa/workbox_versions.sql index a5ea2269c5c..e6ebb86532e 100644 --- a/sql/2025/pwa/workbox_versions.sql +++ b/sql/2025/pwa/workbox_versions.sql @@ -1,4 +1,3 @@ -#standardSQL # Workbox versions (2025) CREATE TEMPORARY FUNCTION getWorkboxVersions(workboxInfo STRING) diff --git a/sql/2025/security/audit_issues.sql b/sql/2025/security/audit_issues.sql index 081b3e2c4ab..0950482b76f 100644 --- a/sql/2025/security/audit_issues.sql +++ b/sql/2025/security/audit_issues.sql @@ -1,4 +1,3 @@ -#standardSQL # Question: What Audit issues are present in the pages? https://chromedevtools.github.io/devtools-protocol/tot/Audits/#type-InspectorIssueCode SELECT client, diff --git a/sql/2025/security/bot_detection.sql b/sql/2025/security/bot_detection.sql index 0ddb6daf856..67884984ca0 100644 --- a/sql/2025/security/bot_detection.sql +++ b/sql/2025/security/bot_detection.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack Preventions - Bot protection services # Question: Which bot protection services are used most often on mobile and desktop sites? # Notes: The Wappalyzer 'Security' category mostly contains bot protection services such as reCAPTCHA and Cloudflare Bot Management diff --git a/sql/2025/security/clear-site-data_value_prevalence.sql b/sql/2025/security/clear-site-data_value_prevalence.sql index 2c9a366afc6..84c074b4680 100644 --- a/sql/2025/security/clear-site-data_value_prevalence.sql +++ b/sql/2025/security/clear-site-data_value_prevalence.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack preventions - Preventing attacks using Clear-Site-Data # Question: Which Clear-Site-Data header values are most prevalent? # Notes: Many used values are still invalid (without quotes). We only count each host-value pair once. diff --git a/sql/2025/security/coep_header_prevalence.sql b/sql/2025/security/coep_header_prevalence.sql index 73be26b23de..520cd6eec7b 100644 --- a/sql/2025/security/coep_header_prevalence.sql +++ b/sql/2025/security/coep_header_prevalence.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack Preventions - Preventing attacks using Cross-Origin policies # Question: Which are the most common COEP values? # Note: Considers headers of main document responses only diff --git a/sql/2025/security/cookie_age_negative.sql b/sql/2025/security/cookie_age_negative.sql index 0eee8728dcc..e9004c56f46 100644 --- a/sql/2025/security/cookie_age_negative.sql +++ b/sql/2025/security/cookie_age_negative.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Cookies - Cookie Age # Question: How many cookies (total, hosts, pages) have negative Max-Age, Expires and real age (Max-Age has precedence over Expires) attributes? # Note: Query is expensive and slow (14TB). Query is inefficient (We create a result array of length 1 for each cookie-attribute for each cookie and then unnest it again; We could instead not use arrays and skip the unnesting). diff --git a/sql/2025/security/cookie_age_percentiles.sql b/sql/2025/security/cookie_age_percentiles.sql index 8a8f260843f..8b0983e4817 100644 --- a/sql/2025/security/cookie_age_percentiles.sql +++ b/sql/2025/security/cookie_age_percentiles.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Cookies - Cookie Age # Question: How long are cookies valid? (Max-Age, Expires, Real Age) # Note: Only incorporates values that are larger than 0; cookies set over all all requests on the root_page diff --git a/sql/2025/security/cookie_attributes.sql b/sql/2025/security/cookie_attributes.sql index d6abb13ef6f..958f4d52886 100644 --- a/sql/2025/security/cookie_attributes.sql +++ b/sql/2025/security/cookie_attributes.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Cookies - Cookie Attributes # Question: What is the prevalence of cookie attributes (HttpOnly, Secure, SameSite, __Secure-, __Host- prefixes, ...) for cookies set on first-party and third-party requests? # Note: NET.REG_DOMAIN does not use the private section of publicsuffix.org (e.g., all *.github.io sites are counted as the same party) diff --git a/sql/2025/security/cookie_max_age_expires_top_values.sql b/sql/2025/security/cookie_max_age_expires_top_values.sql index fb4c6143638..de3ab667a77 100644 --- a/sql/2025/security/cookie_max_age_expires_top_values.sql +++ b/sql/2025/security/cookie_max_age_expires_top_values.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Cookies - Cookie Age # Question: Which are the most common Max-Age and Expires cookie attribute values? # Note: Expensive query could be combined with the other cookie queries to only go over the cookie headers once. diff --git a/sql/2025/security/coop_header_prevalence.sql b/sql/2025/security/coop_header_prevalence.sql index e79319a3e1c..d89a8712788 100644 --- a/sql/2025/security/coop_header_prevalence.sql +++ b/sql/2025/security/coop_header_prevalence.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack Preventions - Preventing attacks using Cross-Origin policies # Question: Which are the most common COOP values? # Note: Considers headers of main document responses only diff --git a/sql/2025/security/corp_header_prevalence.sql b/sql/2025/security/corp_header_prevalence.sql index b63853ccbe4..3f50e375a68 100644 --- a/sql/2025/security/corp_header_prevalence.sql +++ b/sql/2025/security/corp_header_prevalence.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack Preventions - Preventing attacks using Cross-Origin policies # Question: Which are the most common CORP values? # Note: Considers headers of all responses including all subresources (header is used for script and img resources) diff --git a/sql/2025/security/cryptominer_share.sql b/sql/2025/security/cryptominer_share.sql index 536d4cc6390..08eed6e572c 100644 --- a/sql/2025/security/cryptominer_share.sql +++ b/sql/2025/security/cryptominer_share.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Malpractices on the web # Question: Which cryptominers have the largest market share? SELECT diff --git a/sql/2025/security/cryptominer_usage.sql b/sql/2025/security/cryptominer_usage.sql index bdf3e22ef82..099d12e5849 100644 --- a/sql/2025/security/cryptominer_usage.sql +++ b/sql/2025/security/cryptominer_usage.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Malpractices on the web # Question: How many sites used cryptominers over time? # Note: The usage is very low, so maybe we want to drop this query. Also unclear which starting date we want diff --git a/sql/2025/security/csp_allowed_host_frequency.sql b/sql/2025/security/csp_allowed_host_frequency.sql index ab50df2e1e6..398429c4ba1 100644 --- a/sql/2025/security/csp_allowed_host_frequency.sql +++ b/sql/2025/security/csp_allowed_host_frequency.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack preventions - Preventing attacks using CSP # Question: Which are the most common "allowed host" values in CSPs on home pages? WITH totals AS ( diff --git a/sql/2025/security/csp_allowed_host_frequency_wss.sql b/sql/2025/security/csp_allowed_host_frequency_wss.sql index 2906a7abb75..7a27b0d2e0e 100644 --- a/sql/2025/security/csp_allowed_host_frequency_wss.sql +++ b/sql/2025/security/csp_allowed_host_frequency_wss.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack preventions - Preventing attacks using CSP # Question: Which are the most common WSS "allowed host" values in CSPs on home pages? WITH totals AS ( diff --git a/sql/2025/security/csp_directives_usage.sql b/sql/2025/security/csp_directives_usage.sql index 39dbbb3f506..1ff37f44135 100644 --- a/sql/2025/security/csp_directives_usage.sql +++ b/sql/2025/security/csp_directives_usage.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack preventions - Preventing attacks using CSP # Question: Which are the most common CSP directives on home pages? SELECT diff --git a/sql/2025/security/csp_features.sql b/sql/2025/security/csp_features.sql index 5b39b088c93..862fa30e310 100644 --- a/sql/2025/security/csp_features.sql +++ b/sql/2025/security/csp_features.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack preventions - Preventing attacks using CSP # Question: Discrepancy between declared and effective CSP, using BlinkFeatures SELECT diff --git a/sql/2025/security/csp_most_common_header.sql b/sql/2025/security/csp_most_common_header.sql index 6ebd9f01b3b..812a6199bad 100644 --- a/sql/2025/security/csp_most_common_header.sql +++ b/sql/2025/security/csp_most_common_header.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack Preventions - Preventing attacks using CSP # Question: Which are the most common CSP values on home pages? # Note: Only considers CSPs of the home page and not of embedded resources diff --git a/sql/2025/security/csp_number_of_allowed_hosts.sql b/sql/2025/security/csp_number_of_allowed_hosts.sql index 3be7ecbb525..9f308ad9191 100644 --- a/sql/2025/security/csp_number_of_allowed_hosts.sql +++ b/sql/2025/security/csp_number_of_allowed_hosts.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack Preventions - Preventing attacks using CSP # Question: CSP on home pages: number of unique headers, header length and number of allowed HTTP(S) hosts in all directives # Note: for CSP we checked whether the header value is NULL (empty?) (99.65% of CSP headers are not NULL on desktop), we did not do this for other headers? diff --git a/sql/2025/security/csp_script_source_list_keywords_per_header.sql b/sql/2025/security/csp_script_source_list_keywords_per_header.sql index c6798b2764a..b320da2100f 100644 --- a/sql/2025/security/csp_script_source_list_keywords_per_header.sql +++ b/sql/2025/security/csp_script_source_list_keywords_per_header.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack preventions - Preventing attacks using CSP # Note: This query counts multiple CSP headers per request seperately. # Question: usage of default/script-src, and within the directive usage of strict-dynamic, nonce values, unsafe-inline and unsafe-eval diff --git a/sql/2025/security/csp_script_source_list_keywords_per_request.sql b/sql/2025/security/csp_script_source_list_keywords_per_request.sql index d472e093296..1a5f637e57c 100644 --- a/sql/2025/security/csp_script_source_list_keywords_per_request.sql +++ b/sql/2025/security/csp_script_source_list_keywords_per_request.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack preventions - Preventing attacks using CSP # Note: This query combines multiple CSP headers per request into one. # Question: usage of default/script-src, and within the directive usage of strict-dynamic, nonce values, unsafe-inline and unsafe-eval diff --git a/sql/2025/security/documentdomain_usage.sql b/sql/2025/security/documentdomain_usage.sql index 082281add18..dd7be95fbb9 100644 --- a/sql/2025/security/documentdomain_usage.sql +++ b/sql/2025/security/documentdomain_usage.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack preventions - Security Headers? (document.domain feature) # Question: How often is document.domain still used even though deprecated? # Note: Possible to port to httparchive.all.pages, however would require to recreate num_urls, total_urls, and pct_urls diff --git a/sql/2025/security/documentpolicy_most_common_header.sql b/sql/2025/security/documentpolicy_most_common_header.sql index f377d7a2e05..3148ac093a6 100644 --- a/sql/2025/security/documentpolicy_most_common_header.sql +++ b/sql/2025/security/documentpolicy_most_common_header.sql @@ -1,4 +1,3 @@ -#standardSQL # Question: Which are the most common document policy values on home pages? # Note: Only considers document policies of the home page and not of embedded resources # Note: There is no registry of possible directives, see https://github.com/WICG/document-policy/blob/main/integration.md diff --git a/sql/2025/security/feature_adoption_by_category.sql b/sql/2025/security/feature_adoption_by_category.sql index f6225d07977..0b73fd40106 100644 --- a/sql/2025/security/feature_adoption_by_category.sql +++ b/sql/2025/security/feature_adoption_by_category.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Drivers of security mechanism adoption - Website Category # Question: How is security feature adoption and category of a website related? # Note: Not all headers have their individual percentages diff --git a/sql/2025/security/feature_adoption_by_country.sql b/sql/2025/security/feature_adoption_by_country.sql index 2f39ec296b6..b49d49b3bfa 100644 --- a/sql/2025/security/feature_adoption_by_country.sql +++ b/sql/2025/security/feature_adoption_by_country.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Drivers of security mechanism adoption - Location of a website # Question: How is security feature adoption and location of a website related (i.e. which is the most common country visiting that website)? # Note: Security feature adoption grouped by sites frequently visited from different countries diff --git a/sql/2025/security/feature_adoption_by_other_features.sql b/sql/2025/security/feature_adoption_by_other_features.sql index c3d5a3cfd9a..9f4626f12be 100644 --- a/sql/2025/security/feature_adoption_by_other_features.sql +++ b/sql/2025/security/feature_adoption_by_other_features.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Drivers of security mechanism adoption - Other Headers? # Question: Which features (mostly security headers) influence the adoption of other features? # Note: Query seems unnatural after the port; Add other (new) features? diff --git a/sql/2025/security/feature_adoption_by_technology.sql b/sql/2025/security/feature_adoption_by_technology.sql index 1848864089b..5862e9dc31f 100644 --- a/sql/2025/security/feature_adoption_by_technology.sql +++ b/sql/2025/security/feature_adoption_by_technology.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Driveres of security mechanism - Technology stack # Question: How are security features and used technology correlated? # Note: Adoption of features based on the technology that is used diff --git a/sql/2025/security/fp_header_prevalence.sql b/sql/2025/security/fp_header_prevalence.sql index 975680e5986..83edf13d499 100644 --- a/sql/2025/security/fp_header_prevalence.sql +++ b/sql/2025/security/fp_header_prevalence.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: ? (Permissions) # Question: Which are the most common FP values? # Note: Considers headers of main document responses diff --git a/sql/2025/security/home_page_https_usage.sql b/sql/2025/security/home_page_https_usage.sql index e316d4ee887..2f12155e81c 100644 --- a/sql/2025/security/home_page_https_usage.sql +++ b/sql/2025/security/home_page_https_usage.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Transpont Security - Protocol versions # Question: How many websites (home pages only) use HTTP vs HTTPS? SELECT diff --git a/sql/2025/security/hsts_attributes.sql b/sql/2025/security/hsts_attributes.sql index f66ace84a8a..24c0bafe31f 100644 --- a/sql/2025/security/hsts_attributes.sql +++ b/sql/2025/security/hsts_attributes.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Transport Security - HTTP Strict Transport Security # Question: How many websites use HSTS includeSubDomains and preload? SELECT diff --git a/sql/2025/security/hsts_max_age_percentiles.sql b/sql/2025/security/hsts_max_age_percentiles.sql index 1ded69139cd..72c8ca51213 100644 --- a/sql/2025/security/hsts_max_age_percentiles.sql +++ b/sql/2025/security/hsts_max_age_percentiles.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Transport Security - HTTP Strict Transport Security # Question: What is the distribution of max-age values for HSTS? SELECT diff --git a/sql/2025/security/html_sanitization_usage.sql b/sql/2025/security/html_sanitization_usage.sql index 72f8f78ca5b..1259ffa57cb 100644 --- a/sql/2025/security/html_sanitization_usage.sql +++ b/sql/2025/security/html_sanitization_usage.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack preventions - HTML Sanitization # Question: How often is setHTMLUnsafe and parseHTMLUnsafe used? # Note: Possible to port to httparchive.all.pages, however would require to recreate num_urls, total_urls, and pct_urls diff --git a/sql/2025/security/https_request_over_time.sql b/sql/2025/security/https_request_over_time.sql index 644056aecb8..4770319f629 100644 --- a/sql/2025/security/https_request_over_time.sql +++ b/sql/2025/security/https_request_over_time.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Transport Security - ? # Question: How many requests are made via HTTPS over time? # Note: Currently all requests on the landing page; could be restricted to top-level requests only (is_main_document) diff --git a/sql/2025/security/https_server_redirects.sql b/sql/2025/security/https_server_redirects.sql index 9cf05330351..d32446e1435 100644 --- a/sql/2025/security/https_server_redirects.sql +++ b/sql/2025/security/https_server_redirects.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Transport Security - Unused? # Question: How many HTTP requests exist on pages and how many of them server-side redirect to HTTPS # Note: Does not distinguish between whether the main Page URL is HTTP or HTTPS diff --git a/sql/2025/security/iframe_allow_directive_values.sql b/sql/2025/security/iframe_allow_directive_values.sql index 35fcd2aa8f2..5d819ddc733 100644 --- a/sql/2025/security/iframe_allow_directive_values.sql +++ b/sql/2025/security/iframe_allow_directive_values.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Content Inclusion - Permissions Policy # Question: Which are the most prominent directives/directive-value pairs for the allow attributes on iframes? CREATE TEMP FUNCTION getNumWithAllowAttribute(payload ARRAY) AS (( diff --git a/sql/2025/security/iframe_allow_directives.sql b/sql/2025/security/iframe_allow_directives.sql index 118909ecbc2..27ba5e4347b 100644 --- a/sql/2025/security/iframe_allow_directives.sql +++ b/sql/2025/security/iframe_allow_directives.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Content Inclusion - Permissions Policy # Question: Which are the most prominent directives for the allow attributes on iframes? CREATE TEMP FUNCTION getNumWithAllowAttribute(payload ARRAY) AS (( diff --git a/sql/2025/security/iframe_attribute_popular_hosts.sql b/sql/2025/security/iframe_attribute_popular_hosts.sql index 207d433b099..2ea84e5ce71 100644 --- a/sql/2025/security/iframe_attribute_popular_hosts.sql +++ b/sql/2025/security/iframe_attribute_popular_hosts.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Content Inclusion - Iframe Sandbox/Permissions Policy # Question: Wich are the most commont hostnames of iframes that have an allow or sandbox attribute? CREATE TEMP FUNCTION hasPolicy(attr STRING, policy_type STRING) diff --git a/sql/2025/security/iframe_attributes_usage.sql b/sql/2025/security/iframe_attributes_usage.sql index 73456eabbcd..1c862103ef6 100644 --- a/sql/2025/security/iframe_attributes_usage.sql +++ b/sql/2025/security/iframe_attributes_usage.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Content Inclusion - Iframe Sandbox/Permissions Policy # Question: How often are the allow and sandbox attributes used on iframes? Both per page (used in at least one iframe on a page) and over all iframe elements WITH total_iframe_count AS ( diff --git a/sql/2025/security/iframe_attributes_usage_fix.sql b/sql/2025/security/iframe_attributes_usage_fix.sql index 67751b4af41..b0bffe11a33 100644 --- a/sql/2025/security/iframe_attributes_usage_fix.sql +++ b/sql/2025/security/iframe_attributes_usage_fix.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Content Inclusion - Iframe Sandbox/Permissions Policy # Question: How often are the allow and sandbox attributes used on iframes? Both per page (used in at least one iframe on a page) and over all iframe elements WITH total_iframe_count AS ( diff --git a/sql/2025/security/iframe_sandbox_directives.sql b/sql/2025/security/iframe_sandbox_directives.sql index 0f3c135bc5b..d9d218bc5cf 100644 --- a/sql/2025/security/iframe_sandbox_directives.sql +++ b/sql/2025/security/iframe_sandbox_directives.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Content Inclusion - Iframe Sandbox # Question: Which are the most common directives for the sandbox attribute on iframes? CREATE TEMP FUNCTION getNumWithSandboxAttribute(payload ARRAY) AS (( diff --git a/sql/2025/security/meta_csp_disallowed_directives.sql b/sql/2025/security/meta_csp_disallowed_directives.sql index a7bcf57890f..b64972ee51e 100644 --- a/sql/2025/security/meta_csp_disallowed_directives.sql +++ b/sql/2025/security/meta_csp_disallowed_directives.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Security misconfigurations - CSP directives that are ignored in # Question: How many pages use invalid CSP directives in ? # Note: uses the old payload._almanac metric location instead of custom_metrics.almanac (also the meta-nodes metric is in the generic almanac.js custom metric) diff --git a/sql/2025/security/meta_policies_allowed_vs_disallowed.sql b/sql/2025/security/meta_policies_allowed_vs_disallowed.sql index 9ffa77b8f0b..dd43308ecf9 100644 --- a/sql/2025/security/meta_policies_allowed_vs_disallowed.sql +++ b/sql/2025/security/meta_policies_allowed_vs_disallowed.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack preventions - Preventing attacks using # Question: How many pages use security policies in meta tags (both allowed and ignored ones) # Note: uses the old payload._almanac metric location instead of custom_metrics.almanac (also the meta-nodes metric is in the generic almanac.js custom metric) diff --git a/sql/2025/security/mimetype_file_extension_mismatch.sql b/sql/2025/security/mimetype_file_extension_mismatch.sql index 41e4e82011a..40a29bef000 100644 --- a/sql/2025/security/mimetype_file_extension_mismatch.sql +++ b/sql/2025/security/mimetype_file_extension_mismatch.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: unclear # Question: How often does the mimetype of a request and the file extension mismatch across all requests? # Note: Non-SVG images are ignored diff --git a/sql/2025/security/mixed_content.sql b/sql/2025/security/mixed_content.sql index 8af6b8d88d7..aa5314b77fe 100644 --- a/sql/2025/security/mixed_content.sql +++ b/sql/2025/security/mixed_content.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Transport Security - ? # Question: How many landing pages that load over HTTPS have at least one reference over HTTP? (Distributed across ranking) # Note: Each rank bucket does not include lower buckets; diff --git a/sql/2025/security/oac_header_prevalence.sql b/sql/2025/security/oac_header_prevalence.sql index 745f0ca593a..e6c6863fd34 100644 --- a/sql/2025/security/oac_header_prevalence.sql +++ b/sql/2025/security/oac_header_prevalence.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack Preventions - Security Header Adoptions? # Question: Which are the most common OAC values? # Note: Considers headers of all main document responses diff --git a/sql/2025/security/pp_header_prevalence.sql b/sql/2025/security/pp_header_prevalence.sql index 91c6c2218da..deb47fa7e8b 100644 --- a/sql/2025/security/pp_header_prevalence.sql +++ b/sql/2025/security/pp_header_prevalence.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: ? (Permissions) # Question: Which are the most common PP values? # Note: Considers headers of main document responses diff --git a/sql/2025/security/robot_header_and_meta_tag_prevalence.sql b/sql/2025/security/robot_header_and_meta_tag_prevalence.sql index 0b004d8baa8..086805ba49c 100644 --- a/sql/2025/security/robot_header_and_meta_tag_prevalence.sql +++ b/sql/2025/security/robot_header_and_meta_tag_prevalence.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Unclear? # Question: What is the prevalence of robots meta tag values and the X-robots-tag header? WITH meta_tags AS ( diff --git a/sql/2025/security/robot_txt_sensitive_disallow.sql b/sql/2025/security/robot_txt_sensitive_disallow.sql index 4fea944291a..699210970b8 100644 --- a/sql/2025/security/robot_txt_sensitive_disallow.sql +++ b/sql/2025/security/robot_txt_sensitive_disallow.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Well-know URIs - robots.txt (?) # Question: What is the prevalence of /robots.txt and what is the prevalence of potentially sensitive endpoints in disallow directives ('login', 'log-in', 'signin', 'sign-in', 'admin', 'auth', 'sso', 'account') CREATE TEMPORARY FUNCTION getAllDisallowedEndpoints(data JSON) diff --git a/sql/2025/security/security_adoption_by_category.sql b/sql/2025/security/security_adoption_by_category.sql index 719e567c351..dc397ed5822 100644 --- a/sql/2025/security/security_adoption_by_category.sql +++ b/sql/2025/security/security_adoption_by_category.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Drivers of security mechanism adoption - Website category # Question: How prevalent are the various security headers on first-party resources? (per category) # Note: Instead of the parent_category, we could ues full_category or subcategory (https://har.fyi/reference/functions/get_host_categories/) diff --git a/sql/2025/security/security_adoption_by_rank.sql b/sql/2025/security/security_adoption_by_rank.sql index 9aa144cf3f3..636e81b404d 100644 --- a/sql/2025/security/security_adoption_by_rank.sql +++ b/sql/2025/security/security_adoption_by_rank.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Drivers of security mechanism adoption - Website popularity # Question: How prevalent are the various security headers on first-party resources? (per rank grouping 1K, 5K, 10K, 100K, 500K, 1M, ...) # Note: Buckets do not include prior ranks diff --git a/sql/2025/security/security_headers_prevalence.sql b/sql/2025/security/security_headers_prevalence.sql index 7c6c56313a9..0e16d69a61d 100644 --- a/sql/2025/security/security_headers_prevalence.sql +++ b/sql/2025/security/security_headers_prevalence.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack Preventions - Security header adoptions # Question: How prevalent are security headers in a first-party context? (count by number of hosts) # Note: Instead we could only look at top-level responses (is_main_document)? diff --git a/sql/2025/security/server_header_value_prevalence.sql b/sql/2025/security/server_header_value_prevalence.sql index 2cc3e2fc0a4..2647b3dc232 100644 --- a/sql/2025/security/server_header_value_prevalence.sql +++ b/sql/2025/security/server_header_value_prevalence.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: ? # Question: Which are the most common Server and X-Powered-By headers? (count by number of hosts) # Note: Different dates taken together; Is it correct to take the host of the page instead of the URL? Maybe only take is_main_document? diff --git a/sql/2025/security/server_information_header_prevalence.sql b/sql/2025/security/server_information_header_prevalence.sql index 07c9cfee5d9..d968414a55c 100644 --- a/sql/2025/security/server_information_header_prevalence.sql +++ b/sql/2025/security/server_information_header_prevalence.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: ? # Question: How prevalent are headers leaking server information? (count by number of hosts) SELECT diff --git a/sql/2025/security/server_timing_usage_values.sql b/sql/2025/security/server_timing_usage_values.sql index 275d12c9458..25e82ef648d 100644 --- a/sql/2025/security/server_timing_usage_values.sql +++ b/sql/2025/security/server_timing_usage_values.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Security misconfigurations and oversights - (Missing) suppression of 'Server-Timing' header # Question: Which are the most common server-timing headers and how often are they used in total? # Note: Probably better to split some of the things up to make the interpretation of the results easier diff --git a/sql/2025/security/sri_coverage_per_page.sql b/sql/2025/security/sri_coverage_per_page.sql index a2671b0aa6e..04d2f488297 100644 --- a/sql/2025/security/sri_coverage_per_page.sql +++ b/sql/2025/security/sri_coverage_per_page.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Content Inclusion - Subresource Integriy # Question: How many scripts on a page have the integrity attribute? (percentage) CREATE TEMP FUNCTION getNumScriptElements(sris ARRAY) AS ( diff --git a/sql/2025/security/sri_hash_functions.sql b/sql/2025/security/sri_hash_functions.sql index 19c05306e97..7319d3df632 100644 --- a/sql/2025/security/sri_hash_functions.sql +++ b/sql/2025/security/sri_hash_functions.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Content Inclusion - Subresource Integrity # Question: Wich are the most common SRI hash functions used? WITH totals AS ( diff --git a/sql/2025/security/sri_popular_hosts.sql b/sql/2025/security/sri_popular_hosts.sql index 5cb8d56818b..27e1820c975 100644 --- a/sql/2025/security/sri_popular_hosts.sql +++ b/sql/2025/security/sri_popular_hosts.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Content Inclusion - Subresource Integrity # Question: Which are the most popular hosts for which SRI is used on script tags? WITH totals AS ( diff --git a/sql/2025/security/sri_usage.sql b/sql/2025/security/sri_usage.sql index e3cbe74a386..e39c8699efb 100644 --- a/sql/2025/security/sri_usage.sql +++ b/sql/2025/security/sri_usage.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Content Inclusion - Subresource Integrity # Question: How many pages use SRI (per tagname) and what is the tagname usage for all SRI elements? SELECT diff --git a/sql/2025/security/tao_header_prevalence.sql b/sql/2025/security/tao_header_prevalence.sql index ac43bc727af..be703c0ffce 100644 --- a/sql/2025/security/tao_header_prevalence.sql +++ b/sql/2025/security/tao_header_prevalence.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack Preventions - Security Header Adoptions? # Question: Which are the most common TAO values? # Note: Considers headers of all responses including all subresources (header is used for script and img resources) diff --git a/sql/2025/security/tls_ca_expired_cert.sql b/sql/2025/security/tls_ca_expired_cert.sql index dc451beee00..3c96cbf2b12 100644 --- a/sql/2025/security/tls_ca_expired_cert.sql +++ b/sql/2025/security/tls_ca_expired_cert.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Transport Security - Certificate Authority # Question: How many certificates are expired? # Note: currently includes HTTP (i.e., pages with no issuer) diff --git a/sql/2025/security/tls_ca_issuers_pages.sql b/sql/2025/security/tls_ca_issuers_pages.sql index 7546ef39d14..6af73e1df41 100644 --- a/sql/2025/security/tls_ca_issuers_pages.sql +++ b/sql/2025/security/tls_ca_issuers_pages.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Transport Security - Certificate Authority # Question: What is the distribution of CA issuers for all pages? # Note: currently includes HTTP (i.e., pages with no issuer) diff --git a/sql/2025/security/tls_ca_issuers_pages_over_time.sql b/sql/2025/security/tls_ca_issuers_pages_over_time.sql index 2a7ff496963..36157b0442c 100644 --- a/sql/2025/security/tls_ca_issuers_pages_over_time.sql +++ b/sql/2025/security/tls_ca_issuers_pages_over_time.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Transport Security - Certificate Authority # Question: What is the distribution of CA issuers for all pages over time? # Note: currently includes HTTP (i.e., pages with no issuer) diff --git a/sql/2025/security/tls_ca_issuers_requests.sql b/sql/2025/security/tls_ca_issuers_requests.sql index e1ee545a776..cc39ba74950 100644 --- a/sql/2025/security/tls_ca_issuers_requests.sql +++ b/sql/2025/security/tls_ca_issuers_requests.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Transport Security - Certificate Authority # Question: What is the distribution of CA issuers for all (top-level) requests? # Note: original query was without is_main_document but due to the port to the tables it suddently took 50+TB instead of 20GB?! diff --git a/sql/2025/security/tls_cipher_suite.sql b/sql/2025/security/tls_cipher_suite.sql index e34b30a4c25..73314cc990b 100644 --- a/sql/2025/security/tls_cipher_suite.sql +++ b/sql/2025/security/tls_cipher_suite.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Transport Security - Cipher suites # Question: What is the distribution of all ciphers for all requests? # Note: Query is large (43TB) diff --git a/sql/2025/security/tls_forward_secrecy.sql b/sql/2025/security/tls_forward_secrecy.sql index ff9ea3e5980..60a36617deb 100644 --- a/sql/2025/security/tls_forward_secrecy.sql +++ b/sql/2025/security/tls_forward_secrecy.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Transport Security - Cipher Suites # Question: How many used cipher suites support forward secrecy for all requests? # Note: Large query (40+TB) diff --git a/sql/2025/security/tls_versions_pages.sql b/sql/2025/security/tls_versions_pages.sql index 303c0aebdcf..bd156b5b594 100644 --- a/sql/2025/security/tls_versions_pages.sql +++ b/sql/2025/security/tls_versions_pages.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Transport Security - Protocol Versions # Question: Which TLS versions are most common on all TLS-enabled web pages? SELECT diff --git a/sql/2025/security/tls_versions_requests.sql b/sql/2025/security/tls_versions_requests.sql index 99a87710ec4..ab4b1cf122b 100644 --- a/sql/2025/security/tls_versions_requests.sql +++ b/sql/2025/security/tls_versions_requests.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Transport Security - Protocol Versions # Question: What is the distribution of TLS versions on all TLS-enabled requests? # Note: Query is large (40TB) diff --git a/sql/2025/security/version-evolution-top-technologies.sql b/sql/2025/security/version-evolution-top-technologies.sql index 89a79defe5d..facf93afa48 100644 --- a/sql/2025/security/version-evolution-top-technologies.sql +++ b/sql/2025/security/version-evolution-top-technologies.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Drivers of security mechanims - Technology stack # Question: Distribution of the different version of the top 20 technologies used on the web. SELECT diff --git a/sql/2025/security/web_cryptography_api.sql b/sql/2025/security/web_cryptography_api.sql index a8757eb3a3b..b6bd30798d3 100644 --- a/sql/2025/security/web_cryptography_api.sql +++ b/sql/2025/security/web_cryptography_api.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack preventions - Web Cryptography API # Question: Which Web Cryptography APIs are used the most? # Note: Possible to port to httparchive.all.pages, however would require to recreate num_urls, total_urls, and pct_urls diff --git a/sql/2025/security/well-known_change-password.sql b/sql/2025/security/well-known_change-password.sql index 8e80364ad40..568c759371f 100644 --- a/sql/2025/security/well-known_change-password.sql +++ b/sql/2025/security/well-known_change-password.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Well-known URIs - change-password # Question What is the prevalence of correctly configured /.well-known/change-password endpoints? # Notes: Safe Cast is required `.data.status` is not always an INT for some reason diff --git a/sql/2025/security/well-known_resource-not-be-200.sql b/sql/2025/security/well-known_resource-not-be-200.sql index 70beb585c0b..ffcc325ed18 100644 --- a/sql/2025/security/well-known_resource-not-be-200.sql +++ b/sql/2025/security/well-known_resource-not-be-200.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Well-known URIs - Detecting Status Code Reliability # Question: What is the prevalence of servers that return a 200 status code where they should not? # Prevalence of /.well-known/resource-that-should-not-exist-whose-status-code-should-not-be-200 counts status codes diff --git a/sql/2025/security/well-known_security.sql b/sql/2025/security/well-known_security.sql index 34c1552c4c4..d70f4d4f5dc 100644 --- a/sql/2025/security/well-known_security.sql +++ b/sql/2025/security/well-known_security.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Well-known URIs - securityt.txt # Question: What is the prevalence of (signed) /.well-known/security.txt endpoints and prevalence of included attributes (canonical, encryption, expires, policy)? # Note: Query is huge (60TB) and computationally expensive (slow) diff --git a/sql/2025/security/xfo_header_prevalence.sql b/sql/2025/security/xfo_header_prevalence.sql index 17fa5906f66..1b25974f97c 100644 --- a/sql/2025/security/xfo_header_prevalence.sql +++ b/sql/2025/security/xfo_header_prevalence.sql @@ -1,4 +1,3 @@ -#standardSQL # Section: Attack Preventions - Security Header Adoptions? # Question: Which are the most common XFO values? # Note: Considers headers of main document responses diff --git a/sql/2025/seo/anchor-rel-attribute-usage-2025.sql b/sql/2025/seo/anchor-rel-attribute-usage-2025.sql index 66c5da4165f..c7de4b3a2ec 100644 --- a/sql/2025/seo/anchor-rel-attribute-usage-2025.sql +++ b/sql/2025/seo/anchor-rel-attribute-usage-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Anchor rel attribute usage # This query reports if a rel attribute value was ever used on a page, and calculates various statistics. diff --git a/sql/2025/seo/anchor-same-site-occurance-stats-2025.sql b/sql/2025/seo/anchor-same-site-occurance-stats-2025.sql index 1784191e88f..94501e7bad4 100644 --- a/sql/2025/seo/anchor-same-site-occurance-stats-2025.sql +++ b/sql/2025/seo/anchor-same-site-occurance-stats-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Anchor same site occurrence stats # This query aims to highlight sites with few same-site links, like SPAs. diff --git a/sql/2025/seo/content-language-2025.sql b/sql/2025/seo/content-language-2025.sql index 8dcc43db12c..486059eed3b 100644 --- a/sql/2025/seo/content-language-2025.sql +++ b/sql/2025/seo/content-language-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Content Language CREATE TEMPORARY FUNCTION getContentLanguagesAlmanac(almanac JSON) diff --git a/sql/2025/seo/fixed-anchor-same-site-occurance-stats-2025.sql b/sql/2025/seo/fixed-anchor-same-site-occurance-stats-2025.sql index 918220a1606..9b1f6336732 100644 --- a/sql/2025/seo/fixed-anchor-same-site-occurance-stats-2025.sql +++ b/sql/2025/seo/fixed-anchor-same-site-occurance-stats-2025.sql @@ -1,4 +1,3 @@ -#standardSQL -- Anchor same site occurrence stats CREATE TEMPORARY FUNCTION getLinkDesciptions(anchors JSON) diff --git a/sql/2025/seo/hreflang-header-usage-2025.sql b/sql/2025/seo/hreflang-header-usage-2025.sql index d42b74ea205..cb541b8919a 100644 --- a/sql/2025/seo/hreflang-header-usage-2025.sql +++ b/sql/2025/seo/hreflang-header-usage-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # hreflang header usage # Returns all the data we need from _wpt_bodies diff --git a/sql/2025/seo/hreflang-link-tag-usage-2025.sql b/sql/2025/seo/hreflang-link-tag-usage-2025.sql index aff4c35e0a1..4c17c03bbcf 100644 --- a/sql/2025/seo/hreflang-link-tag-usage-2025.sql +++ b/sql/2025/seo/hreflang-link-tag-usage-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # hreflang link tag usage # Returns all the data we need from _wpt_bodies diff --git a/sql/2025/seo/iframe-loading-property-usage-2025.sql b/sql/2025/seo/iframe-loading-property-usage-2025.sql index d4088ef1f3d..eeb5fc78251 100644 --- a/sql/2025/seo/iframe-loading-property-usage-2025.sql +++ b/sql/2025/seo/iframe-loading-property-usage-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Iframe loading property usage # Note: This query only reports if an attribute was ever used on a page. It is not a per iframe report. diff --git a/sql/2025/seo/image-alt-stats-2025.sql b/sql/2025/seo/image-alt-stats-2025.sql index daf5b709ff5..71fa42b9bb8 100644 --- a/sql/2025/seo/image-alt-stats-2025.sql +++ b/sql/2025/seo/image-alt-stats-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Image alt stats # Returns all the data we need from _markup diff --git a/sql/2025/seo/invalid-head-elements-2025.sql b/sql/2025/seo/invalid-head-elements-2025.sql index b6f8132a038..8f767f4f09f 100644 --- a/sql/2025/seo/invalid-head-elements-2025.sql +++ b/sql/2025/seo/invalid-head-elements-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Invalid Head Elements WITH invalid_elements AS ( diff --git a/sql/2025/seo/invalid-head-sites-2025.sql b/sql/2025/seo/invalid-head-sites-2025.sql index 3821eaf0dc5..f081ee76944 100644 --- a/sql/2025/seo/invalid-head-sites-2025.sql +++ b/sql/2025/seo/invalid-head-sites-2025.sql @@ -1,7 +1,5 @@ -#standardSQL # Counted metrics of invalid head elements in HTML -#standardSQL # Counted metrics of invalid head elements in HTML WITH totals AS ( diff --git a/sql/2025/seo/lighthouse-seo-stats-2025.sql b/sql/2025/seo/lighthouse-seo-stats-2025.sql index 2d43dafbc07..6ceb1d90988 100644 --- a/sql/2025/seo/lighthouse-seo-stats-2025.sql +++ b/sql/2025/seo/lighthouse-seo-stats-2025.sql @@ -1,4 +1,3 @@ -#standardSQL -- Lighthouse SEO Stats CREATE TEMPORARY FUNCTION getAudits(audits JSON) diff --git a/sql/2025/seo/llms-status-2025.sql b/sql/2025/seo/llms-status-2025.sql index 2c41acadf07..bd7a9116896 100644 --- a/sql/2025/seo/llms-status-2025.sql +++ b/sql/2025/seo/llms-status-2025.sql @@ -1,4 +1,3 @@ -#standardSQL -- valid = TRUE means "present" or "exists" WITH labeled AS ( diff --git a/sql/2025/seo/llms-txt-errors-2025.sql b/sql/2025/seo/llms-txt-errors-2025.sql index 76bf75effce..b57ada00c34 100644 --- a/sql/2025/seo/llms-txt-errors-2025.sql +++ b/sql/2025/seo/llms-txt-errors-2025.sql @@ -1,4 +1,3 @@ -#standardSQL -- valid = TRUE means "present" or "exists" -- "errors" are likely validation errors, but may/may not still work diff --git a/sql/2025/seo/mark-up-stats-2025.sql b/sql/2025/seo/mark-up-stats-2025.sql index d7e98255df5..3c5f6240020 100644 --- a/sql/2025/seo/mark-up-stats-2025.sql +++ b/sql/2025/seo/mark-up-stats-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Markup stats diff --git a/sql/2025/seo/media-property-usage-link-tags-rel-alternate-2025.sql b/sql/2025/seo/media-property-usage-link-tags-rel-alternate-2025.sql index 72e6b9f0bc2..594ef61e624 100644 --- a/sql/2025/seo/media-property-usage-link-tags-rel-alternate-2025.sql +++ b/sql/2025/seo/media-property-usage-link-tags-rel-alternate-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Media property usage of link tags with rel=alternate # returns all the data we need from _almanac diff --git a/sql/2025/seo/meta-tag-usage-by-name-2025.sql b/sql/2025/seo/meta-tag-usage-by-name-2025.sql index aaa6797c897..08c892cb0f0 100644 --- a/sql/2025/seo/meta-tag-usage-by-name-2025.sql +++ b/sql/2025/seo/meta-tag-usage-by-name-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Meta tag usage by name # returns all the data we need from _almanac diff --git a/sql/2025/seo/meta-tag-usage-by-property-2025.sql b/sql/2025/seo/meta-tag-usage-by-property-2025.sql index 2e2a6154695..8143e65867b 100644 --- a/sql/2025/seo/meta-tag-usage-by-property-2025.sql +++ b/sql/2025/seo/meta-tag-usage-by-property-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Meta tag usage by property diff --git a/sql/2025/seo/outgoing_links_by_rank-2025.sql b/sql/2025/seo/outgoing_links_by_rank-2025.sql index 44d2c7200a9..1257fd3b7c9 100644 --- a/sql/2025/seo/outgoing_links_by_rank-2025.sql +++ b/sql/2025/seo/outgoing_links_by_rank-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Internal and external link metrics by quantile and rank WITH page_metrics AS ( SELECT diff --git a/sql/2025/seo/pages-canonical-stats-2025.sql b/sql/2025/seo/pages-canonical-stats-2025.sql index 67c99187979..834557bef95 100644 --- a/sql/2025/seo/pages-canonical-stats-2025.sql +++ b/sql/2025/seo/pages-canonical-stats-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # page canonical metrics by device # Note: Contains redundant stats to seo-stats.sql in order to start better segmenting metrics away from monolithic queries. diff --git a/sql/2025/seo/pages-containing-a-video-element-2025.sql b/sql/2025/seo/pages-containing-a-video-element-2025.sql index a0dd7caedc8..76832c23c4d 100644 --- a/sql/2025/seo/pages-containing-a-video-element-2025.sql +++ b/sql/2025/seo/pages-containing-a-video-element-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Pages containing a video element diff --git a/sql/2025/seo/robots-meta-usage-2025.sql b/sql/2025/seo/robots-meta-usage-2025.sql index 61cc46cbdf1..4628d9a2292 100644 --- a/sql/2025/seo/robots-meta-usage-2025.sql +++ b/sql/2025/seo/robots-meta-usage-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Robots meta/header user agent directive usage CREATE TEMPORARY FUNCTION parseRobotsMeta(robotsMetaJson STRING) diff --git a/sql/2025/seo/robots-text-size-2025.sql b/sql/2025/seo/robots-text-size-2025.sql index c773e6a5d6a..32a9fcdce41 100644 --- a/sql/2025/seo/robots-text-size-2025.sql +++ b/sql/2025/seo/robots-text-size-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Robots meta/header user agent directive usage CREATE TEMPORARY FUNCTION parseRobotsMeta(robotsMeta JSON) diff --git a/sql/2025/seo/robots-txt-size-2025.sql b/sql/2025/seo/robots-txt-size-2025.sql index 842cf76aad4..711949376d8 100644 --- a/sql/2025/seo/robots-txt-size-2025.sql +++ b/sql/2025/seo/robots-txt-size-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Robots.txt size SELECT client, diff --git a/sql/2025/seo/robots-txt-status-codes -2025.sql b/sql/2025/seo/robots-txt-status-codes -2025.sql index e54b87c8179..da69d48e2df 100644 --- a/sql/2025/seo/robots-txt-status-codes -2025.sql +++ b/sql/2025/seo/robots-txt-status-codes -2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Robots txt status codes # returns all the data we need from _robots_txt diff --git a/sql/2025/seo/robots-txt-user-agent-usage-2025.sql b/sql/2025/seo/robots-txt-user-agent-usage-2025.sql index 82c93ebdd15..b95852cb71f 100644 --- a/sql/2025/seo/robots-txt-user-agent-usage-2025.sql +++ b/sql/2025/seo/robots-txt-user-agent-usage-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Robots txt user agent usage diff --git a/sql/2025/seo/root-pages-valid-llms-2025.sql b/sql/2025/seo/root-pages-valid-llms-2025.sql index b37fa685b8f..f9cf21f2226 100644 --- a/sql/2025/seo/root-pages-valid-llms-2025.sql +++ b/sql/2025/seo/root-pages-valid-llms-2025.sql @@ -1,4 +1,3 @@ -#standardSQL SELECT client, diff --git a/sql/2025/seo/seo-stats-2025.sql b/sql/2025/seo/seo-stats-2025.sql index 28433d28d35..c64532f3962 100644 --- a/sql/2025/seo/seo-stats-2025.sql +++ b/sql/2025/seo/seo-stats-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # SEO stats # Note: Canonical metrics moved to pages-canonical-stats.sql. Should be removed from here in 2022. diff --git a/sql/2025/seo/seo-stats-by-percentile-2025.sql b/sql/2025/seo/seo-stats-by-percentile-2025.sql index cc15669ec8e..7a16fce2657 100644 --- a/sql/2025/seo/seo-stats-by-percentile-2025.sql +++ b/sql/2025/seo/seo-stats-by-percentile-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # SEO stats by percentile # returns all the data we need from _wpt_bodies diff --git a/sql/2025/seo/structured-data-formats-2025.sql b/sql/2025/seo/structured-data-formats-2025.sql index 599281440e1..b7f18518d4c 100644 --- a/sql/2025/seo/structured-data-formats-2025.sql +++ b/sql/2025/seo/structured-data-formats-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Structured data formats # returns all the data we need from _wpt_bodies diff --git a/sql/2025/seo/structured-data-schema-types-2025.sql b/sql/2025/seo/structured-data-schema-types-2025.sql index 3fbf8b0005f..3e7a8ac8e0a 100644 --- a/sql/2025/seo/structured-data-schema-types-2025.sql +++ b/sql/2025/seo/structured-data-schema-types-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Structured data schema types # returns all the data we need from _wpt_bodies diff --git a/sql/2025/seo/test-invalid-head-sites.sql b/sql/2025/seo/test-invalid-head-sites.sql index c3a3d58fc2f..f8517d5ad5d 100644 --- a/sql/2025/seo/test-invalid-head-sites.sql +++ b/sql/2025/seo/test-invalid-head-sites.sql @@ -1,4 +1,3 @@ -#standardSQL # Test query to validate invalid head sites are being detected # This should return non-zero values if the fix is working diff --git a/sql/2025/seo/unused-css-js-2025.sql b/sql/2025/seo/unused-css-js-2025.sql index beedf050b92..e9fcbff7e6e 100644 --- a/sql/2025/seo/unused-css-js-2025.sql +++ b/sql/2025/seo/unused-css-js-2025.sql @@ -1,4 +1,3 @@ -#standardSQL # Unused CSS and JS SELECT diff --git a/sql/2025/sustainability/cache_header_usage.sql b/sql/2025/sustainability/cache_header_usage.sql index 3b8b3781568..211f1a635ea 100644 --- a/sql/2025/sustainability/cache_header_usage.sql +++ b/sql/2025/sustainability/cache_header_usage.sql @@ -1,4 +1,3 @@ -#standardSQL # The distribution of cache header adoption on websites by client. SELECT diff --git a/sql/2025/sustainability/cdn_adoption.sql b/sql/2025/sustainability/cdn_adoption.sql index d0c665f543e..c1c934d6611 100644 --- a/sql/2025/sustainability/cdn_adoption.sql +++ b/sql/2025/sustainability/cdn_adoption.sql @@ -1,4 +1,3 @@ -#standardSQL # The distribution of CDN adoption on websites by client. SELECT diff --git a/sql/2025/sustainability/cms_bytes_per_type.sql b/sql/2025/sustainability/cms_bytes_per_type.sql index ea921ea0838..90a1e64ecc0 100644 --- a/sql/2025/sustainability/cms_bytes_per_type.sql +++ b/sql/2025/sustainability/cms_bytes_per_type.sql @@ -1,4 +1,3 @@ -#standardSQL # Median resource weights by CMS # Declare variables to calculate the carbon emissions of one byte diff --git a/sql/2025/sustainability/content-visibility.sql b/sql/2025/sustainability/content-visibility.sql index b2c9784d573..9a910f3c4e1 100644 --- a/sql/2025/sustainability/content-visibility.sql +++ b/sql/2025/sustainability/content-visibility.sql @@ -1,4 +1,3 @@ -#standardSQL CREATE TEMPORARY FUNCTION HASCONTENTVISIBILITY(css JSON) RETURNS ARRAY> LANGUAGE js diff --git a/sql/2025/sustainability/ecommerce_bytes_per_type.sql b/sql/2025/sustainability/ecommerce_bytes_per_type.sql index 06ecc4b690a..538f91b0c39 100644 --- a/sql/2025/sustainability/ecommerce_bytes_per_type.sql +++ b/sql/2025/sustainability/ecommerce_bytes_per_type.sql @@ -1,4 +1,3 @@ -#standardSQL # Median resource weights by ecommerce platform with detailed CO2e breakdown # Source: https://sustainablewebdesign.org/calculating-digital-emissions/ # Declare variables to calculate the carbon emissions per gigabyte (kWh/GB) diff --git a/sql/2025/sustainability/favicons.sql b/sql/2025/sustainability/favicons.sql index 93f84593c2b..e10c5d01c4d 100644 --- a/sql/2025/sustainability/favicons.sql +++ b/sql/2025/sustainability/favicons.sql @@ -1,4 +1,3 @@ -#standardSQL # Temporary function to extract favicon image extensions from the JSON payload CREATE TEMPORARY FUNCTION GETFAVICONIMAGE(almanac JSON) RETURNS STRING LANGUAGE js AS ''' diff --git a/sql/2025/sustainability/global_emissions_per_page.sql b/sql/2025/sustainability/global_emissions_per_page.sql index fddadfe4dad..56b2c4907a0 100644 --- a/sql/2025/sustainability/global_emissions_per_page.sql +++ b/sql/2025/sustainability/global_emissions_per_page.sql @@ -1,4 +1,3 @@ -#standardSQL # The distribution of page weight by resource type and client, with updated # SWDM v4 methodology including both operational and embodied emissions diff --git a/sql/2025/sustainability/green_third_party_requests.sql b/sql/2025/sustainability/green_third_party_requests.sql index 4318e62ad83..6a9222b248c 100644 --- a/sql/2025/sustainability/green_third_party_requests.sql +++ b/sql/2025/sustainability/green_third_party_requests.sql @@ -1,4 +1,3 @@ -#standardSQL # Median third-parties & green third-party requests per websites by rank WITH third_party_date AS ( diff --git a/sql/2025/sustainability/page_byte_pre_type.sql b/sql/2025/sustainability/page_byte_pre_type.sql index 425eb8d0fa1..40e5f2fba85 100644 --- a/sql/2025/sustainability/page_byte_pre_type.sql +++ b/sql/2025/sustainability/page_byte_pre_type.sql @@ -1,4 +1,3 @@ -#standardSQL -- Energy consumption factors from SWDM v4 (in TWh/ZB) # 290 TWh / 5.29 ZB diff --git a/sql/2025/sustainability/responsive_images.sql b/sql/2025/sustainability/responsive_images.sql index 8cb0cb5f637..20cd6d6face 100644 --- a/sql/2025/sustainability/responsive_images.sql +++ b/sql/2025/sustainability/responsive_images.sql @@ -1,4 +1,3 @@ -#standardSQL # percent of sites using images with srcset w/wo sizes, or picture element WITH page_data AS ( diff --git a/sql/2025/sustainability/script_count.sql b/sql/2025/sustainability/script_count.sql index b98bf00a3bc..238ace85a8b 100644 --- a/sql/2025/sustainability/script_count.sql +++ b/sql/2025/sustainability/script_count.sql @@ -1,4 +1,3 @@ -#standardSQL # Breakdown of inline vs external scripts WITH script_data AS ( SELECT diff --git a/sql/2025/sustainability/ssg_bytes_per_type.sql b/sql/2025/sustainability/ssg_bytes_per_type.sql index b45faf4a6e7..39c7743b0a2 100644 --- a/sql/2025/sustainability/ssg_bytes_per_type.sql +++ b/sql/2025/sustainability/ssg_bytes_per_type.sql @@ -1,4 +1,3 @@ -#standardSQL # Median resource weights by static site generator with detailed CO2e breakdown # Source: https://sustainablewebdesign.org/calculating-digital-emissions/ diff --git a/sql/2025/sustainability/stylesheet_count.sql b/sql/2025/sustainability/stylesheet_count.sql index e8d98032a0a..6893759d968 100644 --- a/sql/2025/sustainability/stylesheet_count.sql +++ b/sql/2025/sustainability/stylesheet_count.sql @@ -1,4 +1,3 @@ -#standardSQL # Breakdown of inline vs external scripts WITH stylesheet_data AS ( SELECT diff --git a/sql/2025/sustainability/unminified_css_bytes.sql b/sql/2025/sustainability/unminified_css_bytes.sql index 4acdbdaa2e7..ec5ab82e98e 100644 --- a/sql/2025/sustainability/unminified_css_bytes.sql +++ b/sql/2025/sustainability/unminified_css_bytes.sql @@ -1,4 +1,3 @@ -#standardSQL # Distribution of unminified CSS request bytes per page SELECT diff --git a/sql/2025/sustainability/unminified_js_bytes.sql b/sql/2025/sustainability/unminified_js_bytes.sql index cf6249aa3a9..7b11828cc82 100644 --- a/sql/2025/sustainability/unminified_js_bytes.sql +++ b/sql/2025/sustainability/unminified_js_bytes.sql @@ -1,4 +1,3 @@ -#standardSQL # Distribution of unminified JS request bytes per page SELECT diff --git a/sql/2025/sustainability/unused_css_bytes.sql b/sql/2025/sustainability/unused_css_bytes.sql index 5dc4a35d4d4..85ed05cf160 100644 --- a/sql/2025/sustainability/unused_css_bytes.sql +++ b/sql/2025/sustainability/unused_css_bytes.sql @@ -1,4 +1,3 @@ -#standardSQL # Distribution of unused CSS request bytes per page SELECT diff --git a/sql/2025/sustainability/unused_js_bytes.sql b/sql/2025/sustainability/unused_js_bytes.sql index 62d41c98fd9..f1114de95ed 100644 --- a/sql/2025/sustainability/unused_js_bytes.sql +++ b/sql/2025/sustainability/unused_js_bytes.sql @@ -1,4 +1,3 @@ -#standardSQL # Distribution of unused JS request bytes per page SELECT diff --git a/sql/2025/sustainability/use_of_prefers_dark_mode_usage.sql b/sql/2025/sustainability/use_of_prefers_dark_mode_usage.sql index b62fed0794b..1bbed6926d6 100644 --- a/sql/2025/sustainability/use_of_prefers_dark_mode_usage.sql +++ b/sql/2025/sustainability/use_of_prefers_dark_mode_usage.sql @@ -1,4 +1,3 @@ -#standardSQL # The distribution of websites by client that use the prefers-color-scheme:dark # media query. diff --git a/sql/2025/third-parties/consent_signal_basic_analysis.sql b/sql/2025/third-parties/consent_signal_basic_analysis.sql index aac8ad9dd53..38d16537406 100644 --- a/sql/2025/third-parties/consent_signal_basic_analysis.sql +++ b/sql/2025/third-parties/consent_signal_basic_analysis.sql @@ -1,4 +1,3 @@ -#standardSQL # Basic consent signal analysis (simplified version to ensure data returns) WITH pages AS ( diff --git a/sql/2025/third-parties/consent_signal_prevalence_by_third_party_category.sql b/sql/2025/third-parties/consent_signal_prevalence_by_third_party_category.sql index ca72152d977..1cc6832444c 100644 --- a/sql/2025/third-parties/consent_signal_prevalence_by_third_party_category.sql +++ b/sql/2025/third-parties/consent_signal_prevalence_by_third_party_category.sql @@ -1,4 +1,3 @@ -#standardSQL # Consent signal prevalence broken down by third-party category WITH pages AS ( diff --git a/sql/2025/third-parties/consent_signal_survival_rate_through_chains.sql b/sql/2025/third-parties/consent_signal_survival_rate_through_chains.sql index eb7e2da6163..218912fd3c1 100644 --- a/sql/2025/third-parties/consent_signal_survival_rate_through_chains.sql +++ b/sql/2025/third-parties/consent_signal_survival_rate_through_chains.sql @@ -1,4 +1,3 @@ -#standardSQL # Optimized: Consent signal survival rate through inclusion chains (memory-efficient) CREATE TEMP FUNCTION extractConsentSignals(url STRING) diff --git a/sql/2025/third-parties/consent_signal_survival_rate_through_redirects.sql b/sql/2025/third-parties/consent_signal_survival_rate_through_redirects.sql index f2bc1d609bc..3a68e9e93a2 100644 --- a/sql/2025/third-parties/consent_signal_survival_rate_through_redirects.sql +++ b/sql/2025/third-parties/consent_signal_survival_rate_through_redirects.sql @@ -1,4 +1,3 @@ -#standardSQL # Consent signal survival rate through HTTP redirects (memory-efficient) CREATE TEMP FUNCTION extractConsentSignals(url STRING) diff --git a/sql/2025/third-parties/consent_signals_by_parameter_and_domain_optimized.sql b/sql/2025/third-parties/consent_signals_by_parameter_and_domain_optimized.sql index cbc7da0a4e5..0bcbb4e4522 100644 --- a/sql/2025/third-parties/consent_signals_by_parameter_and_domain_optimized.sql +++ b/sql/2025/third-parties/consent_signals_by_parameter_and_domain_optimized.sql @@ -1,4 +1,3 @@ -#standardSQL # Detailed breakdown of consent signals by individual parameters and top domains WITH pages AS ( diff --git a/sql/2025/third-parties/distribution_of_websites_by_number_of_third_parties.sql b/sql/2025/third-parties/distribution_of_websites_by_number_of_third_parties.sql index 7e2eb6165b6..a564202aaaf 100644 --- a/sql/2025/third-parties/distribution_of_websites_by_number_of_third_parties.sql +++ b/sql/2025/third-parties/distribution_of_websites_by_number_of_third_parties.sql @@ -1,4 +1,3 @@ -#standardSQL # Distribution of websites by number of third party -- updated for crawl.requests diff --git a/sql/2025/third-parties/number_of_third_parties_by_rank.sql b/sql/2025/third-parties/number_of_third_parties_by_rank.sql index 3e858d5c99b..1e046cd6f4f 100644 --- a/sql/2025/third-parties/number_of_third_parties_by_rank.sql +++ b/sql/2025/third-parties/number_of_third_parties_by_rank.sql @@ -1,4 +1,3 @@ -#standardSQL # Number of third-parties per websites by rank WITH requests AS ( diff --git a/sql/2025/third-parties/number_of_third_parties_by_rank_and_category.sql b/sql/2025/third-parties/number_of_third_parties_by_rank_and_category.sql index 0e3e8711004..e4bb0038ee3 100644 --- a/sql/2025/third-parties/number_of_third_parties_by_rank_and_category.sql +++ b/sql/2025/third-parties/number_of_third_parties_by_rank_and_category.sql @@ -1,4 +1,3 @@ -#standardSQL # Number of third-parties per websites by rank and category WITH requests AS ( diff --git a/sql/2025/third-parties/number_of_third_party_providers_by_rank_and_category.sql b/sql/2025/third-parties/number_of_third_party_providers_by_rank_and_category.sql index f786b83715a..572acab9ba1 100644 --- a/sql/2025/third-parties/number_of_third_party_providers_by_rank_and_category.sql +++ b/sql/2025/third-parties/number_of_third_party_providers_by_rank_and_category.sql @@ -1,4 +1,3 @@ -#standardSQL # Number of third-party providers per websites by rank and category WITH requests AS ( diff --git a/sql/2025/third-parties/number_of_third_party_requests_by_rank.sql b/sql/2025/third-parties/number_of_third_party_requests_by_rank.sql index c63c3ba89cb..888f325343f 100644 --- a/sql/2025/third-parties/number_of_third_party_requests_by_rank.sql +++ b/sql/2025/third-parties/number_of_third_party_requests_by_rank.sql @@ -1,4 +1,3 @@ -#standardSQL # Number of third-party requests by rank WITH requests AS ( diff --git a/sql/2025/third-parties/number_of_third_party_requests_per_page_by_rank.sql b/sql/2025/third-parties/number_of_third_party_requests_per_page_by_rank.sql index cfc54316b1b..6b50df1501f 100644 --- a/sql/2025/third-parties/number_of_third_party_requests_per_page_by_rank.sql +++ b/sql/2025/third-parties/number_of_third_party_requests_per_page_by_rank.sql @@ -1,4 +1,3 @@ -#standardSQL # Number of third-party requests per page by rank WITH requests AS ( diff --git a/sql/2025/third-parties/percent_of_third_parties_by_content_type.sql b/sql/2025/third-parties/percent_of_third_parties_by_content_type.sql index 18481200c68..206d071ba08 100644 --- a/sql/2025/third-parties/percent_of_third_parties_by_content_type.sql +++ b/sql/2025/third-parties/percent_of_third_parties_by_content_type.sql @@ -1,4 +1,3 @@ -#standardSQL # Percent of third party requests by content type. WITH requests AS ( diff --git a/sql/2025/third-parties/percent_of_websites_with_third_party_by_ranking.sql b/sql/2025/third-parties/percent_of_websites_with_third_party_by_ranking.sql index ee4ff6a1052..7e7a91e733d 100644 --- a/sql/2025/third-parties/percent_of_websites_with_third_party_by_ranking.sql +++ b/sql/2025/third-parties/percent_of_websites_with_third_party_by_ranking.sql @@ -1,4 +1,3 @@ -#standardSQL # Percent of websites with third parties by ranking WITH requests AS ( diff --git a/sql/2025/third-parties/prevalence_of_consent_signals_in_third_party_requests_optimized.sql b/sql/2025/third-parties/prevalence_of_consent_signals_in_third_party_requests_optimized.sql index 580c8df3002..37eed08d6b8 100644 --- a/sql/2025/third-parties/prevalence_of_consent_signals_in_third_party_requests_optimized.sql +++ b/sql/2025/third-parties/prevalence_of_consent_signals_in_third_party_requests_optimized.sql @@ -1,4 +1,3 @@ -#standardSQL # Prevalence of specific consent signals (USP, TCF, GPP) in third-party requests WITH pages AS ( diff --git a/sql/2025/third-parties/top100_third_parties_by_number_of_websites.sql b/sql/2025/third-parties/top100_third_parties_by_number_of_websites.sql index dc915aa07d8..475a9d85a48 100644 --- a/sql/2025/third-parties/top100_third_parties_by_number_of_websites.sql +++ b/sql/2025/third-parties/top100_third_parties_by_number_of_websites.sql @@ -1,4 +1,3 @@ -#standardSQL # Top 100 third parties by number of websites WITH requests AS ( From 097f21e312cea6a61c06ffb5a228c7e68113cef7 Mon Sep 17 00:00:00 2001 From: Max Ostapenko <1611259+max-ostapenko@users.noreply.github.com> Date: Sun, 1 Mar 2026 19:01:22 +0100 Subject: [PATCH 2/3] removed space in filename --- ...xt-status-codes -2025.sql => robots-txt-status-codes-2025.sql} | 0 1 file changed, 0 insertions(+), 0 deletions(-) rename sql/2025/seo/{robots-txt-status-codes -2025.sql => robots-txt-status-codes-2025.sql} (100%) diff --git a/sql/2025/seo/robots-txt-status-codes -2025.sql b/sql/2025/seo/robots-txt-status-codes-2025.sql similarity index 100% rename from sql/2025/seo/robots-txt-status-codes -2025.sql rename to sql/2025/seo/robots-txt-status-codes-2025.sql From cc170e1504873a835c6347264cc9531f41234d26 Mon Sep 17 00:00:00 2001 From: Max Ostapenko <1611259+max-ostapenko@users.noreply.github.com> Date: Sun, 1 Mar 2026 19:07:55 +0100 Subject: [PATCH 3/3] lint --- sql/2025/accessibility/media_query_features.sql | 1 - sql/2025/accessibility/units_properties.sql | 1 - sql/2025/seo/llms-status-2025.sql | 1 - sql/2025/seo/llms-txt-errors-2025.sql | 1 - sql/2025/seo/root-pages-valid-llms-2025.sql | 1 - sql/2025/sustainability/page_byte_pre_type.sql | 1 - sql/2025/sustainability/ssg_bytes_per_type.sql | 1 - 7 files changed, 7 deletions(-) diff --git a/sql/2025/accessibility/media_query_features.sql b/sql/2025/accessibility/media_query_features.sql index 764365e9e69..cc351ac967e 100644 --- a/sql/2025/accessibility/media_query_features.sql +++ b/sql/2025/accessibility/media_query_features.sql @@ -1,4 +1,3 @@ - CREATE TEMPORARY FUNCTION getMediaQueryFeatures(css JSON) RETURNS ARRAY LANGUAGE js diff --git a/sql/2025/accessibility/units_properties.sql b/sql/2025/accessibility/units_properties.sql index 92993769613..e08c62de5b0 100644 --- a/sql/2025/accessibility/units_properties.sql +++ b/sql/2025/accessibility/units_properties.sql @@ -1,4 +1,3 @@ - CREATE TEMPORARY FUNCTION getPropertyUnits(css JSON) RETURNS ARRAY> LANGUAGE js diff --git a/sql/2025/seo/llms-status-2025.sql b/sql/2025/seo/llms-status-2025.sql index bd7a9116896..d43545cfdac 100644 --- a/sql/2025/seo/llms-status-2025.sql +++ b/sql/2025/seo/llms-status-2025.sql @@ -1,4 +1,3 @@ - -- valid = TRUE means "present" or "exists" WITH labeled AS ( SELECT diff --git a/sql/2025/seo/llms-txt-errors-2025.sql b/sql/2025/seo/llms-txt-errors-2025.sql index b57ada00c34..374d1129481 100644 --- a/sql/2025/seo/llms-txt-errors-2025.sql +++ b/sql/2025/seo/llms-txt-errors-2025.sql @@ -1,4 +1,3 @@ - -- valid = TRUE means "present" or "exists" -- "errors" are likely validation errors, but may/may not still work WITH found AS ( diff --git a/sql/2025/seo/root-pages-valid-llms-2025.sql b/sql/2025/seo/root-pages-valid-llms-2025.sql index f9cf21f2226..1554081d450 100644 --- a/sql/2025/seo/root-pages-valid-llms-2025.sql +++ b/sql/2025/seo/root-pages-valid-llms-2025.sql @@ -1,4 +1,3 @@ - SELECT client, COUNTIF(SAFE_CAST(JSON_VALUE(custom_metrics.other.llms_txt_validation.valid) AS BOOL)) AS valid_llms, diff --git a/sql/2025/sustainability/page_byte_pre_type.sql b/sql/2025/sustainability/page_byte_pre_type.sql index 40e5f2fba85..06473cf9ff6 100644 --- a/sql/2025/sustainability/page_byte_pre_type.sql +++ b/sql/2025/sustainability/page_byte_pre_type.sql @@ -1,4 +1,3 @@ - -- Energy consumption factors from SWDM v4 (in TWh/ZB) # 290 TWh / 5.29 ZB DECLARE ENERGY_PER_GB_DATACENTER NUMERIC DEFAULT 0.00006829493087557603; diff --git a/sql/2025/sustainability/ssg_bytes_per_type.sql b/sql/2025/sustainability/ssg_bytes_per_type.sql index 39c7743b0a2..b64ea969f68 100644 --- a/sql/2025/sustainability/ssg_bytes_per_type.sql +++ b/sql/2025/sustainability/ssg_bytes_per_type.sql @@ -1,4 +1,3 @@ - # Median resource weights by static site generator with detailed CO2e breakdown # Source: https://sustainablewebdesign.org/calculating-digital-emissions/ # Declare variables to calculate the carbon emissions per gigabyte (kWh/GB)