{
  "openapi": "3.0.1",
  "info": {
    "title": "CORE Open Access Paper Search",
    "description": "Search and extract open access academic papers from CORE -- the world's largest aggregator of open access research with over 300 million metadata records and 40+ million full-text papers. Filter by keyword, year range, and language.",
    "version": "2.0",
    "x-build-id": "sxcCEnWORPe3lYC6u"
  },
  "servers": [
    {
      "url": "https://api.apify.com/v2"
    }
  ],
  "paths": {
    "/acts/ryanclinton~core-academic-search/run-sync-get-dataset-items": {
      "post": {
        "operationId": "run-sync-get-dataset-items-ryanclinton-core-academic-search",
        "x-openai-isConsequential": false,
        "summary": "Executes an Actor, waits for its completion, and returns Actor's dataset items in response.",
        "tags": [
          "Run Actor"
        ],
        "requestBody": {
          "required": true,
          "content": {
            "application/json": {
              "schema": {
                "$ref": "#/components/schemas/inputSchema"
              }
            }
          }
        },
        "parameters": [
          {
            "name": "token",
            "in": "query",
            "required": true,
            "schema": {
              "type": "string"
            },
            "description": "Enter your Apify token here"
          }
        ],
        "responses": {
          "200": {
            "description": "OK"
          }
        }
      }
    },
    "/acts/ryanclinton~core-academic-search/runs": {
      "post": {
        "operationId": "runs-sync-ryanclinton-core-academic-search",
        "x-openai-isConsequential": false,
        "summary": "Executes an Actor and returns information about the initiated run in response.",
        "tags": [
          "Run Actor"
        ],
        "requestBody": {
          "required": true,
          "content": {
            "application/json": {
              "schema": {
                "$ref": "#/components/schemas/inputSchema"
              }
            }
          }
        },
        "parameters": [
          {
            "name": "token",
            "in": "query",
            "required": true,
            "schema": {
              "type": "string"
            },
            "description": "Enter your Apify token here"
          }
        ],
        "responses": {
          "200": {
            "description": "OK",
            "content": {
              "application/json": {
                "schema": {
                  "$ref": "#/components/schemas/runsResponseSchema"
                }
              }
            }
          }
        }
      }
    },
    "/acts/ryanclinton~core-academic-search/run-sync": {
      "post": {
        "operationId": "run-sync-ryanclinton-core-academic-search",
        "x-openai-isConsequential": false,
        "summary": "Executes an Actor, waits for completion, and returns the OUTPUT from Key-value store in response.",
        "tags": [
          "Run Actor"
        ],
        "requestBody": {
          "required": true,
          "content": {
            "application/json": {
              "schema": {
                "$ref": "#/components/schemas/inputSchema"
              }
            }
          }
        },
        "parameters": [
          {
            "name": "token",
            "in": "query",
            "required": true,
            "schema": {
              "type": "string"
            },
            "description": "Enter your Apify token here"
          }
        ],
        "responses": {
          "200": {
            "description": "OK"
          }
        }
      }
    }
  },
  "components": {
    "schemas": {
      "inputSchema": {
        "type": "object",
        "required": [
          "query"
        ],
        "properties": {
          "apiKey": {
            "title": "CORE API Key",
            "type": "string",
            "description": "Your free CORE API key. Register at https://core.ac.uk/services/api to get one."
          },
          "query": {
            "title": "Search Query",
            "type": "string",
            "description": "Keywords to search across titles, abstracts, and full text. Supports Boolean operators (AND, OR, NOT) directly.",
            "default": "artificial intelligence"
          },
          "researchPreset": {
            "title": "Research Preset",
            "enum": [
              "none",
              "literature-review",
              "state-of-the-art",
              "historical-foundations",
              "thesis-sources",
              "monitoring"
            ],
            "type": "string",
            "description": "One-pick research intent that sets sensible defaults for the gate, dedupe, filters, and monitoring. Your own explicit settings always override the preset. literature-review: read-ready, de-duplicated, grade B+ with PDF verification. state-of-the-art: recent (<=3y) and already cited (>=25). historical-foundations: highly cited (>=100). thesis-sources: theses only. monitoring: emit only changed papers across runs.",
            "default": "none"
          },
          "exactPhrases": {
            "title": "Exact Phrases",
            "type": "array",
            "description": "Phrases that must appear verbatim (each is matched as an exact phrase).",
            "items": {
              "type": "string"
            }
          },
          "mustInclude": {
            "title": "Must Include (all)",
            "type": "array",
            "description": "Terms that must all be present in the results.",
            "items": {
              "type": "string"
            }
          },
          "mustExclude": {
            "title": "Must Exclude",
            "type": "array",
            "description": "Terms to exclude from results (e.g. 'survey', 'review').",
            "items": {
              "type": "string"
            }
          },
          "titleOnly": {
            "title": "Match Query in Title Only",
            "type": "boolean",
            "description": "Restrict the main query to paper titles instead of full text.",
            "default": false
          },
          "author": {
            "title": "Author Name",
            "type": "string",
            "description": "Filter to papers by an author whose name matches this value."
          },
          "publisher": {
            "title": "Publisher",
            "type": "string",
            "description": "Filter to papers from a specific publisher."
          },
          "minCitations": {
            "title": "Minimum Citations",
            "minimum": 0,
            "type": "integer",
            "description": "Only return papers with at least this many citations."
          },
          "yearFrom": {
            "title": "Year From",
            "type": "integer",
            "description": "Filter papers published from this year onwards."
          },
          "yearTo": {
            "title": "Year To",
            "type": "integer",
            "description": "Filter papers published up to this year."
          },
          "language": {
            "title": "Language",
            "type": "string",
            "description": "Filter by language code (e.g., 'en' for English, 'de' for German)."
          },
          "fullTextOnly": {
            "title": "Full Text Only",
            "type": "boolean",
            "description": "Only return papers that have a downloadable full text PDF.",
            "default": false
          },
          "documentTypes": {
            "title": "Document Types",
            "type": "array",
            "description": "Keep only papers whose document type matches one of these (e.g. 'research', 'thesis', 'preprint'). Applied after fetch.",
            "items": {
              "type": "string"
            }
          },
          "repository": {
            "title": "Repository Contains",
            "type": "string",
            "description": "Keep only papers hosted by a repository whose name contains this text (e.g. 'arXiv', 'Strathclyde'). Applied after fetch."
          },
          "maxResults": {
            "title": "Max Results",
            "maximum": 500,
            "type": "integer",
            "description": "Maximum number of papers to return (up to 500).",
            "default": 50
          },
          "pdfVerification": {
            "title": "Full-text Verification",
            "enum": [
              "none",
              "url-present",
              "head-check"
            ],
            "type": "string",
            "description": "none: no check. url-present: flag whether a download URL exists (no network call). head-check: live HEAD request per PDF to confirm it is downloadable now (adds one request per paper).",
            "default": "none"
          },
          "qualityGate": {
            "title": "Quality Gate",
            "type": "object",
            "description": "Acceptance criteria object, e.g. { \"minGrade\": \"B\", \"requirePdf\": true, \"minCitations\": 5, \"maxAgeYears\": 8, \"excludeDuplicates\": true }."
          },
          "dropFiltered": {
            "title": "Drop Gate-Failing Papers",
            "type": "boolean",
            "description": "When the quality gate is set, exclude dropped papers from the dataset (still counted in the corpus summary).",
            "default": false
          },
          "dedupeMode": {
            "title": "Deduplication Mode",
            "enum": [
              "none",
              "doi",
              "strict",
              "fuzzy"
            ],
            "type": "string",
            "description": "none: off. doi: DOI exact match. strict: DOI or normalized title+author+year. fuzzy: strict plus near-identical title detection.",
            "default": "doi"
          },
          "watchlistName": {
            "title": "Watchlist Name (monitoring)",
            "type": "string",
            "description": "Name a watchlist to track papers across runs. Each paper is flagged NEW the first time it appears, SEEN afterwards, with changedFields (citationCount, retrievability, becameReadable). Leave blank for one-off searches."
          },
          "watchlistMode": {
            "title": "Watchlist Output Mode",
            "enum": [
              "flag-all",
              "new-only",
              "changed-only"
            ],
            "type": "string",
            "description": "flag-all: emit every paper with its watchlist status. new-only: emit only papers new since the last run. changed-only: emit only new or changed papers.",
            "default": "flag-all"
          },
          "compareQuery": {
            "title": "Compare Query (benchmark)",
            "type": "string",
            "description": "Optional. A second query to benchmark against the main query. Emits a 'benchmark' record comparing the two corpora on health score (PDF availability, readiness, de-duplication). Runs a second CORE search."
          },
          "outputMode": {
            "title": "Output Mode",
            "enum": [
              "papers",
              "corpus",
              "benchmark"
            ],
            "type": "string",
            "description": "papers: one record per paper plus a corpus-summary digest. corpus: suppress per-paper rows and return only the run-level corpus-summary digest — charged as a single event. benchmark: compare your query against compareQuery on corpus health and return only a head-to-head comparison table — charged as a single event (requires compareQuery).",
            "default": "papers"
          },
          "outputProfile": {
            "title": "Output Profile",
            "enum": [
              "minimal",
              "standard",
              "full"
            ],
            "type": "string",
            "description": "minimal: headline decision fields only. standard: adds authors, citations, repositories, recency, provenance. full: every field including abstract, scoring breakdown, and all source URLs.",
            "default": "standard"
          }
        }
      },
      "runsResponseSchema": {
        "type": "object",
        "properties": {
          "data": {
            "type": "object",
            "properties": {
              "id": {
                "type": "string"
              },
              "actId": {
                "type": "string"
              },
              "userId": {
                "type": "string"
              },
              "startedAt": {
                "type": "string",
                "format": "date-time",
                "example": "2025-01-08T00:00:00.000Z"
              },
              "finishedAt": {
                "type": "string",
                "format": "date-time",
                "example": "2025-01-08T00:00:00.000Z"
              },
              "status": {
                "type": "string",
                "example": "READY"
              },
              "meta": {
                "type": "object",
                "properties": {
                  "origin": {
                    "type": "string",
                    "example": "API"
                  },
                  "userAgent": {
                    "type": "string"
                  }
                }
              },
              "stats": {
                "type": "object",
                "properties": {
                  "inputBodyLen": {
                    "type": "integer",
                    "example": 2000
                  },
                  "rebootCount": {
                    "type": "integer",
                    "example": 0
                  },
                  "restartCount": {
                    "type": "integer",
                    "example": 0
                  },
                  "resurrectCount": {
                    "type": "integer",
                    "example": 0
                  },
                  "computeUnits": {
                    "type": "integer",
                    "example": 0
                  }
                }
              },
              "options": {
                "type": "object",
                "properties": {
                  "build": {
                    "type": "string",
                    "example": "latest"
                  },
                  "timeoutSecs": {
                    "type": "integer",
                    "example": 300
                  },
                  "memoryMbytes": {
                    "type": "integer",
                    "example": 1024
                  },
                  "diskMbytes": {
                    "type": "integer",
                    "example": 2048
                  }
                }
              },
              "buildId": {
                "type": "string"
              },
              "defaultKeyValueStoreId": {
                "type": "string"
              },
              "defaultDatasetId": {
                "type": "string"
              },
              "defaultRequestQueueId": {
                "type": "string"
              },
              "buildNumber": {
                "type": "string",
                "example": "1.0.0"
              },
              "containerUrl": {
                "type": "string"
              },
              "usage": {
                "type": "object",
                "properties": {
                  "ACTOR_COMPUTE_UNITS": {
                    "type": "integer",
                    "example": 0
                  },
                  "DATASET_READS": {
                    "type": "integer",
                    "example": 0
                  },
                  "DATASET_WRITES": {
                    "type": "integer",
                    "example": 0
                  },
                  "KEY_VALUE_STORE_READS": {
                    "type": "integer",
                    "example": 0
                  },
                  "KEY_VALUE_STORE_WRITES": {
                    "type": "integer",
                    "example": 1
                  },
                  "KEY_VALUE_STORE_LISTS": {
                    "type": "integer",
                    "example": 0
                  },
                  "REQUEST_QUEUE_READS": {
                    "type": "integer",
                    "example": 0
                  },
                  "REQUEST_QUEUE_WRITES": {
                    "type": "integer",
                    "example": 0
                  },
                  "DATA_TRANSFER_INTERNAL_GBYTES": {
                    "type": "integer",
                    "example": 0
                  },
                  "DATA_TRANSFER_EXTERNAL_GBYTES": {
                    "type": "integer",
                    "example": 0
                  },
                  "PROXY_RESIDENTIAL_TRANSFER_GBYTES": {
                    "type": "integer",
                    "example": 0
                  },
                  "PROXY_SERPS": {
                    "type": "integer",
                    "example": 0
                  }
                }
              },
              "usageTotalUsd": {
                "type": "number",
                "example": 0.00005
              },
              "usageUsd": {
                "type": "object",
                "properties": {
                  "ACTOR_COMPUTE_UNITS": {
                    "type": "integer",
                    "example": 0
                  },
                  "DATASET_READS": {
                    "type": "integer",
                    "example": 0
                  },
                  "DATASET_WRITES": {
                    "type": "integer",
                    "example": 0
                  },
                  "KEY_VALUE_STORE_READS": {
                    "type": "integer",
                    "example": 0
                  },
                  "KEY_VALUE_STORE_WRITES": {
                    "type": "number",
                    "example": 0.00005
                  },
                  "KEY_VALUE_STORE_LISTS": {
                    "type": "integer",
                    "example": 0
                  },
                  "REQUEST_QUEUE_READS": {
                    "type": "integer",
                    "example": 0
                  },
                  "REQUEST_QUEUE_WRITES": {
                    "type": "integer",
                    "example": 0
                  },
                  "DATA_TRANSFER_INTERNAL_GBYTES": {
                    "type": "integer",
                    "example": 0
                  },
                  "DATA_TRANSFER_EXTERNAL_GBYTES": {
                    "type": "integer",
                    "example": 0
                  },
                  "PROXY_RESIDENTIAL_TRANSFER_GBYTES": {
                    "type": "integer",
                    "example": 0
                  },
                  "PROXY_SERPS": {
                    "type": "integer",
                    "example": 0
                  }
                }
              }
            }
          }
        }
      }
    }
  }
}