freelawproject · mlissner · Feb 1, 2017 · Feb 1, 2017 · Feb 1, 2017
diff --git a/juriscraper/opinions/united_states/state/__init__.py b/juriscraper/opinions/united_states/state/__init__.py
@@ -65,6 +65,7 @@
     'michctapp_p',
     'michctapp_u',
     'minn',
+    'minnag',
     'minnctapp',
     'miss_beginningofyear',
     'miss',

diff --git a/juriscraper/opinions/united_states/state/minnag.py b/juriscraper/opinions/united_states/state/minnag.py
@@ -0,0 +1,101 @@
+"""Scraper for Minnesota Attorney General Opinions
+CourtID: minnag
+Court Short Name: MN
+Author: David Cook
+Reviewer:
+"""
+
+import re
+from lxml import html
+
+from juriscraper.OpinionSite import OpinionSite
+from juriscraper.lib.string_utils import convert_date_string
+
+# Runs of whitespace; collapsed to one space in names and summaries.
+_WHITESPACE = re.compile(r'\s+')
+
+
+def _collapse_whitespace(text):
+    """Collapse whitespace runs in ``text`` to one space and trim the ends."""
+    return _WHITESPACE.sub(' ', text).strip()
+
+
+class Site(OpinionSite):
+    """Collect opinion metadata from the Minnesota AG opinions listing.
+
+    ``_download`` parses the listing into ``self.opinions``; each ``_get_*``
+    method then returns one field of those entries, in the order collected.
+    """
+
+    def __init__(self, *args, **kwargs):
+        super(Site, self).__init__(*args, **kwargs)
+        self.court_id = self.__module__
+        self.domain = 'http://www.ag.state.mn.us'
+        self.url = 'http://www.ag.state.mn.us/office/opinions/DATE.asp'
+        # One dict per opinion, with keys: name, url, date, summary.
+        self.opinions = []
+
+    def _download(self, request_dict=None):
+        """Run the parent download, then fill ``self.opinions`` from it.
+
+        :param request_dict: forwarded to the parent ``_download``; ``None``
+            (the default) is replaced by a fresh empty dict.
+        :return: the value returned by the parent ``_download``.
+        """
+        # A literal ``{}`` default would be one dict shared by every call.
+        if request_dict is None:
+            request_dict = {}
+        # Named ``page`` so the imported ``lxml.html`` module is not shadowed.
+        page = super(Site, self)._download(request_dict)
+        self._extract_case_data_from_html(page)
+        return page
+
+    def _extract_case_data_from_html(self, html):
+        """Append one entry to ``self.opinions`` per listing paragraph.
+
+        :param html: the object returned by the parent ``_download``; only
+            its ``xpath`` method is used here. The parameter name hides the
+            imported ``lxml.html`` module inside this method.
+        :raises IndexError: when a paragraph lacks the link href, the
+            ``<strong>`` text, or an em dash in the text that follows it.
+        """
+        for p in html.xpath("//div[@id='content']/div[@id='op']/p"):
+            # The text right after the <strong> date is split on its first
+            # em dash; the part after the dash is the opinion name.
+            after_date = p.xpath('a/strong/following-sibling::text()[1]')[0]
+            name = _collapse_whitespace(after_date.split(u"\u2014", 1)[1])
+
+            # Text that follows a <br> child of the paragraph, including
+            # text nested in later sibling elements, joined with spaces.
+            summary_parts = p.xpath(
+                'br/following-sibling::text() | '
+                'br/following-sibling::*//text()'
+            )
+            summary = _collapse_whitespace(' '.join(summary_parts))
+
+            self.opinions.append({
+                'name': name,
+                'url': p.xpath('a/@href')[0],
+                'date': convert_date_string(p.xpath('a/strong/text()')[0]),
+                'summary': summary,
+            })
+
+    def _get_case_names(self):
+        """Return the name of every collected opinion."""
+        return [opinion['name'] for opinion in self.opinions]
+
+    def _get_download_urls(self):
+        """Return the link href of every collected opinion."""
+        return [opinion['url'] for opinion in self.opinions]
+
+    def _get_case_dates(self):
+        """Return the converted date of every collected opinion."""
+        return [opinion['date'] for opinion in self.opinions]
+
+    def _get_summaries(self):
+        """Return the summary text of every collected opinion."""
+        return [opinion['summary'] for opinion in self.opinions]
+
+    def _get_precedential_statuses(self):
+        """Return 'Published' once per collected opinion."""
+        return ['Published'] * len(self.opinions)