Duplicate Pages inc Non Indexable
Pages that share an identical title, description and near-identical content with other pages found in the same crawl, excluding the Primary page from each set of duplicates. The page with the highest DeepRank is selected as the Primary in each set of duplicates.
Priority: None
Impact: Neutral
How to fetch the data for this report template
You will need to run a crawl for the report template to generate the report. Once the report has been generated and you have the crawl ID, you can fetch the data for the report using the following query:
- Query
- Variables
- cURL
# Fetches a page of URL rows, plus the total row count, for one report of one crawl.
#   $crawlId            - ID of the crawl the report belongs to (required).
#   $reportTemplateCode - code of the report template, e.g. "duplicate_pages_inc_non_indexable" (required).
#   $after              - optional cursor; presumably the endCursor returned with the
#                         previous page (confirm against the API's pagination docs).
query GetReportStatForCrawl(
  $crawlId: ObjectID!
  $reportTemplateCode: String!
  $after: String
) {
  getReportStat(
    input: {crawlId: $crawlId, reportTemplateCode: $reportTemplateCode}
  ) {
    crawlUrls(after: $after, reportType: Basic) {
      nodes {
        # General page fields
        pageTitle
        url
        primaryUrl
        foundAtUrl
        duplicatePageCount
        deeprank
        level

        # duplicateTitle* fields
        duplicateTitle
        duplicateTitlePrimaryUrl
        duplicateTitleNonIndexable

        # duplicateBody* fields
        duplicateBody
        duplicateBodyPrimaryUrl
        duplicateBodyNonIndexable

        # duplicateDescription* fields
        duplicateDescription
        duplicateDescriptionPrimaryUrl
        duplicateDescriptionNonIndexable

        # foundIn* fields
        foundInGoogleAnalytics
        foundInGoogleSearchConsole
        foundInBacklinks
        foundInList
        foundInLogSummary
        foundInWebCrawl
        foundInSitemap
      }
      totalCount
      # Cursor information for requesting further pages via $after
      pageInfo {
        endCursor
        hasNextPage
      }
    }
  }
}
{"crawlId":"TjAwNUNyYXdsNDAwMA","reportTemplateCode":"duplicate_pages_inc_non_indexable"}
# POST the GetReportStatForCrawl query and its variables to the GraphQL endpoint.
# Replace YOUR_API_SESSION_TOKEN with your own API session token before running.
curl --request POST \
  --header "Content-Type: application/json" \
  --header "apollographql-client-name: docs-example-client" \
  --header "apollographql-client-version: 1.0.0" \
  --header "x-auth-token: YOUR_API_SESSION_TOKEN" \
  --data '{"query":"query GetReportStatForCrawl( $crawlId: ObjectID! $reportTemplateCode: String! $after: String ) { getReportStat( input: {crawlId: $crawlId, reportTemplateCode: $reportTemplateCode} ) { crawlUrls(after: $after, reportType: Basic) { nodes { pageTitle url primaryUrl foundAtUrl duplicatePageCount deeprank level duplicateTitle duplicateTitlePrimaryUrl duplicateTitleNonIndexable duplicateBody duplicateBodyPrimaryUrl duplicateBodyNonIndexable duplicateDescription duplicateDescriptionPrimaryUrl duplicateDescriptionNonIndexable foundInGoogleAnalytics foundInGoogleSearchConsole foundInBacklinks foundInList foundInLogSummary foundInWebCrawl foundInSitemap } totalCount pageInfo { endCursor hasNextPage } } } }","variables":{"crawlId":"TjAwNUNyYXdsNDAwMA","reportTemplateCode":"duplicate_pages_inc_non_indexable"}}' \
  https://api.lumar.io/graphql