Blue Frog Keyspace Schema
The `blue_frog` keyspace mirrors the `domain_discovery` layout but stores every collection type as plain `TEXT` containing JSON. This allows older clients to query data without Cassandra collection type issues. Primary keys match the original tables.
Tables
certstream_domains

| Column | Type |
| --- | --- |
| `domain` | text PRIMARY KEY |
domains_processed

| Column | Type |
| --- | --- |
| `domain` | text |
| `tld` | text |
| `registered` | timestamp |
| `registrar` | text |
| `updated` | timestamp |
| `status` | text |
| `as_name` | text |
| `as_number` | int |
| `isp` | text |
| `org` | text |
| `city` | text |
| `region` | text |
| `region_name` | text |
| `country` | text |
| `country_code` | text |
| `continent` | text |
| `continent_code` | text |
| `lat` | float |
| `lon` | float |
| `languages` | text |
| `phone` | text |
| `time_zone` | text |
| `ssl_issuer` | text |
| `ssl_org` | text |
| `x_powered_by` | text |
| `tech_detect` | text |
| `wordpress_asset_version` | text |
| `site_type` | text |
| `site_category` | text |
| `site_type_tags` | text |
| `title` | text |
| `description` | text |
| `linkedin_url` | text |
| `has_about_page` | boolean |
| `has_services_page` | boolean |
| `has_cart_or_product` | boolean |
| `more_than_5_internal_links` | boolean |
| `contains_gtm_or_ga` | boolean |
| `wordpress_version` | text |
| `server_type` | text |
| `server_version` | text |
| `wpjson_size_bytes` | int |
| `wpjson_contains_cart` | boolean |
| `emails` | text |
| `phone_numbers` | text |
| `sms_numbers` | text |
| `addresses` | text |
| `favicon_url` | text |
| `robots_txt_exists` | boolean |
| `robots_txt_content` | text |
| `canonical_url` | text |
| `h1_count` | int |
| `h2_count` | int |
| `h3_count` | int |
| `schema_markup_detected` | boolean |
| `schema_types` | text |
| `security_headers_score` | int |
| `security_headers_detected` | text |
| `hsts_enabled` | boolean |
| `cookie_compliance` | boolean |
| `third_party_scripts` | int |
| `color_contrast_issues` | int |
| `aria_landmark_count` | int |
| `form_accessibility_issues` | int |
| `social_media_profiles` | text |
| `rss_feed_detected` | boolean |
| `newsletter_signup_detected` | boolean |
| `cdn_detected` | boolean |
| `http_version` | text |
| `compression_enabled` | boolean |
| `cache_control_headers` | text |
| `page_weight_bytes` | int |
| `main_language` | text |
| `content_keywords` | text |
| `ecommerce_platforms` | text |
| `sitemap_page_count` | int |
| `postal_code` | text |
| `meta_tag_count` | int |
| `sitemap_robots_conflict` | boolean |
| `insecure_cookie_count` | int |
| `external_resource_count` | int |
| `passive_subdomain_count` | int |
| `open_ports` | text |
| `allowed_http_methods` | text |
| `waf_name` | text |
| `directory_scan` | text |
| `certificate_info` | text |
| `desktop_accessibility_score` | int |
| `mobile_accessibility_score` | int |
| `desktop_best_practices_score` | int |
| `mobile_best_practices_score` | int |
| `desktop_performance_score` | int |
| `mobile_performance_score` | int |
| `desktop_seo_score` | int |
| `mobile_seo_score` | int |
| `desktop_first_contentful_paint` | float |
| `mobile_first_contentful_paint` | float |
| `desktop_largest_contentful_paint` | float |
| `mobile_largest_contentful_paint` | float |
| `desktop_interactive` | float |
| `mobile_interactive` | float |
| `desktop_speed_index` | float |
| `mobile_speed_index` | float |
| `desktop_total_blocking_time` | float |
| `mobile_total_blocking_time` | float |
| `desktop_cumulative_layout_shift` | float |
| `mobile_cumulative_layout_shift` | float |
| `desktop_timing_total` | float |
| `mobile_timing_total` | float |
| `lighthouse_version` | text |
| `lighthouse_fetch_time` | timestamp |
| `lighthouse_url` | text |
| `raw_subdomains` | text |
| `desktop_performance_suggestions` | text |
| `mobile_performance_suggestions` | text |
| `desktop_accessibility_suggestions` | text |
| `mobile_accessibility_suggestions` | text |
| `desktop_seo_suggestions` | text |
| `mobile_seo_suggestions` | text |
| `user_managed` | boolean |
| `refresh_hours` | int |
| `last_enriched` | timestamp |

- PRIMARY KEY (`domain`, `tld`)
domain_page_metrics

| Column | Type |
| --- | --- |
| `domain` | text |
| `url` | text |
| `scan_date` | timestamp |
| `desktop_accessibility_score` | int |
| `mobile_accessibility_score` | int |
| `desktop_best_practices_score` | int |
| `mobile_best_practices_score` | int |
| `desktop_performance_score` | int |
| `mobile_performance_score` | int |
| `desktop_seo_score` | int |
| `mobile_seo_score` | int |
| `desktop_first_contentful_paint` | float |
| `mobile_first_contentful_paint` | float |
| `desktop_largest_contentful_paint` | float |
| `mobile_largest_contentful_paint` | float |
| `desktop_interactive` | float |
| `mobile_interactive` | float |
| `desktop_speed_index` | float |
| `mobile_speed_index` | float |
| `desktop_total_blocking_time` | float |
| `mobile_total_blocking_time` | float |
| `desktop_cumulative_layout_shift` | float |
| `mobile_cumulative_layout_shift` | float |
| `desktop_timing_total` | float |
| `mobile_timing_total` | float |
| `lighthouse_version` | text |
| `lighthouse_fetch_time` | timestamp |
| `lighthouse_url` | text |
| `desktop_performance_suggestions` | text |
| `mobile_performance_suggestions` | text |
| `desktop_accessibility_suggestions` | text |
| `mobile_accessibility_suggestions` | text |
| `desktop_seo_suggestions` | text |
| `mobile_seo_suggestions` | text |
| `status_code` | int |
| `redirect_chain` | text |
| `page_load_time_ms` | int |
| `broken_links_count` | int |
| `internal_links_count` | int |
| `external_links_count` | int |
| `page_images_count` | int |
| `missing_alt_text_images_count` | int |
| `video_embeds_count` | int |
| `iframe_embeds_count` | int |
| `duplicate_meta_titles` | boolean |
| `duplicate_meta_descriptions` | boolean |
| `emails` | text |
| `phone_numbers` | text |
| `sms_numbers` | text |
| `addresses` | text |
| `wpt_load_time_ms` | int |
| `wpt_speed_index` | float |
| `wpt_ttfb_ms` | int |
| `screenshot_path` | text |
| `heatmap_path` | text |

- PRIMARY KEY (`domain`, `url`, `scan_date`)
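analytics_tag_health

| Column | Type |
| --- | --- |
| `domain` | text |
| `scan_date` | timestamp |
| `working_variants` | text |
| `scanned_urls` | text |
| `found_analytics` | text |
| `page_results` | text |
| `variant_results` | text |
| `compliance_status` | text |

- PRIMARY KEY (`domain`, `scan_date`)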
carbon_audits

| Column | Type |
| --- | --- |
| `domain` | text |
| `url` | text |
| `scan_date` | timestamp |
| `bytes` | int |
| `co2` | float |

- PRIMARY KEY (`domain`, `url`, `scan_date`)
dns_records

| Column | Type |
| --- | --- |
| `domain` | text |
| `record_type` | text |
| `record_value` | text |
| `scan_date` | timestamp |

- PRIMARY KEY ((`domain`, `record_type`), `record_value`, `scan_date`)
misc_tool_results

| Column | Type |
| --- | --- |
| `domain` | text |
| `url` | text |
| `tool_name` | text |
| `scan_date` | timestamp |
| `data` | text |

- PRIMARY KEY (`domain`, `url`, `tool_name`, `scan_date`)
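businesses

| Column | Type |
| --- | --- |
| `name` | text |
| `address` | text |
| `website` | text |
| `phone` | text |
| `reviews_average` | float |
| `query` | text |
| `latitude` | float |
| `longitude` | float |

- PRIMARY KEY (`name`, `address`)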
tracking_specs

| Column | Type |
| --- | --- |
| `category` | text |
| `tool` | text |
| `name` | text |
| `rule` | text |
| `example` | text |
| `description` | text |
| `updated_at` | timestamp |

- PRIMARY KEY ((`category`, `tool`), `name`)