ContentMine · tarrow · Aug 18, 2016 · May 26, 2014 · May 27, 2014 · May 27, 2014
diff --git a/scrapers/apa.json b/scrapers/apa.json
diff --git a/scrapers/bmc.json b/scrapers/bmc.json
@@ -1,5 +1,9 @@
 {
+<<<<<<< HEAD
+"url": "www\\.biomedcentral\\.com",
+=======
 "url": "biomedcentral\\.com",
+>>>>>>> 5ba53bf6d08fc9d102cccc623c5511502f7711c1
 "elements": {
 "publisher": {
 "selector": "//meta[@name='citation_publisher']",
@@ -38,11 +42,19 @@
 "attribute": "content"
 },
 "description": {
+<<<<<<< HEAD
+"selector": "//meta[@name='description']",
+"attribute": "content"
+},
+"abstract": {
+"selector": "//meta[@name='description']",
+=======
 "selector": "//meta[@name='dc.description']",
 "attribute": "content"
 },
 "abstract": {
 "selector": "//meta[@name='dc.description']",
+>>>>>>> 5ba53bf6d08fc9d102cccc623c5511502f7711c1
 "attribute": "content"
 },
 "fulltext_html": {
@@ -59,17 +71,46 @@
 "rename": "fulltext.pdf"
 }
 },
+<<<<<<< HEAD
+"fulltext_xml": {
+"selector": "//a[.='Download XML']",
+"attribute": "href",
+"download": {
+"rename": "fulltext.xml"
+}
+},
+"supplementary_material": {
+"selector": "//link[starts-with(@title,'Additional file')]",
+=======
 "supplementary_material": {
 "selector": "//a[@class='filename']",
+>>>>>>> 5ba53bf6d08fc9d102cccc623c5511502f7711c1
 "attribute": "href",
 "download": true
 },
 "figure": {
+<<<<<<< HEAD
+"selector": "//div[@class='fig']/p/a/img",
+=======
 "selector": "//figure[@class='Figure']/div/img",
+>>>>>>> 5ba53bf6d08fc9d102cccc623c5511502f7711c1
 "attribute": "src",
 "download": true
 },
 "figure_caption": {
+<<<<<<< HEAD
+"selector": "//div[@class='fig']//strong"
+},
+"license": {
+"selector": "//p[a/@href='http://creativecommons.org/licenses/by/4.0']"
+},
+"copyright": {
+"selector": "//p[contains(.,'licensee')]"
+}
+}
+}
+
+=======
 "selector": "//figure[@class='Figure']/figcaption"
 },
 "license": {
@@ -81,3 +122,4 @@
 }
 }
 }
+>>>>>>> 5ba53bf6d08fc9d102cccc623c5511502f7711c1
diff --git a/scrapers/elsevier.json b/scrapers/elsevier.json
@@ -0,0 +1,25 @@
+{
+  "url": "sciencedirect\\.com",
+  "elements": {
+    "title": {
+      "selector": "/html/head/title",
+      "attribute": "text"
+    },
+    "fulltext_html": {
+      "selector": "//link[contains(@rel, 'canonical')]",
+      "attribute": "href",
+      "download": {
+        "rename": "fulltext.html"
+      }
+    },
+
+    "fulltext_pdf": {
+      "selector": "//*[contains(@id, 'pdfLink')]",
+      "attribute": "href",
+      "download": {
+        "rename": "fulltext.pdf"
+      }
+    }
+  }
+}
+
diff --git a/scrapers/sage.json b/scrapers/sage.json
@@ -1,11 +1,13 @@
 {
+
   "url": ".*sagepub.*\\.com",
   "headless": true,
   "elements": {
     "publisher": {
       "selector": "//meta[@name='DC.Publisher']",
       "attribute": "content"
     },
+
     "title": {
       "selector": "//meta[@name='DC.Title']",
       "attribute": "content"
@@ -15,24 +17,28 @@
       "attribute": "content"
     },
     "date": {
-      "selector": "//meta[@name='citation_online_date']",
+      "selector": "//meta[@name='DC.Date']",
       "attribute": "content"
     },
+
     "doi": {
       "selector": "//meta[@name='citation_doi']",
       "attribute": "content"
     },
+
     "issn": {
       "selector": "//meta[@name='citation_issn']",
       "attribute": "content"
     },
+
     "fulltext_pdf": {
       "selector": "//meta[@name='citation_pdf_url']",
       "attribute": "content",
       "download": {
         "rename": "fulltext.pdf"
       }
     },
+
     "fulltext_html": {
       "selector": "//meta[@name='citation_fulltext_html_url']",
       "attribute": "content",
@@ -41,4 +47,4 @@
       }
     }
   }
-}
+}
diff --git a/scrapers/springer.json b/scrapers/springer.json
@@ -1,4 +1,4 @@
-{
+  {
   "url": ".*springer.*\\.com",
   "headless": true,
   "elements": {
@@ -10,6 +10,7 @@
       "selector": "//meta[@name='citation_title']",
       "attribute": "content"
     },
+
     "authors": {
       "selector": "//meta[@name='citation_author']",
       "attribute": "content"
@@ -18,10 +19,12 @@
       "selector": "//meta[@name='citation_online_date']",
       "attribute": "content"
     },
+
     "doi": {
       "selector": "//meta[@name='citation_doi']",
       "attribute": "content"
     },
+
     "issn": {
       "selector": "//meta[@name='citation_issn']",
       "attribute": "content"
@@ -33,6 +36,7 @@
         "rename": "fulltext.pdf"
       }
     },
+
     "fulltext_html": {
       "selector": "//meta[@name='citation_fulltext_html_url']",
       "attribute": "content",