From f49e5870a2a2ad8cb34a1b20785fd4f402f8133e Mon Sep 17 00:00:00 2001 From: Gabriel Reimers Date: Fri, 23 Sep 2016 17:56:40 +0200 Subject: [PATCH] - adds RISM demo crawler --- command_line_scripts/indexRISM.php | 40 ++++++++++++++++++++++++++++++ src/RISMIncipitCrawler.php | 2 +- 2 files changed, 41 insertions(+), 1 deletion(-) create mode 100644 command_line_scripts/indexRISM.php diff --git a/command_line_scripts/indexRISM.php b/command_line_scripts/indexRISM.php new file mode 100644 index 0000000..3e1a8d1 --- /dev/null +++ b/command_line_scripts/indexRISM.php @@ -0,0 +1,40 @@ +createIndex(); +$crawler->crawlCatalog(); \ No newline at end of file diff --git a/src/RISMIncipitCrawler.php b/src/RISMIncipitCrawler.php index 5266d23..a9fee24 100644 --- a/src/RISMIncipitCrawler.php +++ b/src/RISMIncipitCrawler.php @@ -112,7 +112,7 @@ public function crawlCatalog() { $startID = 400110660; - $endID = 400110862; + $endID = 400110999; for ($i = $startID; $i < $endID; $i++) { $url = "https://opac.rism.info/id/rismid/" . $i . "?format=marc";