update.

turbou · turbou · commit a25274da939f · 2024-10-20T10:51:36.000+09:00
diff --git a/feeds/index.html b/feeds/index.html
@@ -3,8 +3,10 @@ <h2>リリース情報</h2>
 <hr>
 <h2>RSS feed</h2>
 <h3>Contrast</h3>
-Contrast Release Note<br />
-<a target="_blank" href="https://contrastsecurity.dev/contrast-documentation-rss/contrast_rlsnote.xml">https://contrastsecurity.dev/contrast-documentation-rss/contrast_rlsnote.xml</a>
+Contrast Release Note(SaaS)<br />
+<a target="_blank" href="https://contrastsecurity.dev/contrast-documentation-rss/contrast_rlsnote_saas.xml">https://contrastsecurity.dev/contrast-documentation-rss/contrast_rlsnote_saas.xml</a><br />
+Contrast Release Note(On-premises)<br />
+<a target="_blank" href="https://contrastsecurity.dev/contrast-documentation-rss/contrast_rlsnote_eop.xml">https://contrastsecurity.dev/contrast-documentation-rss/contrast_rlsnote_eop.xml</a>
 <hr />
 <h3>.NET Core</h3>
 .NET Core Agent Release Note<br />
diff --git a/work/contrast_rlsnote.py b/work/contrast_rlsnote.py
@@ -19,7 +19,7 @@ def main():
     feed = Rss201rev2Feed(
         title='Contrast Release Note',
         link='https://contrastsecurity.dev/contrast-documentation-rss',
-        description='Java Agent Release Note',
+        description='Contrast Release Note',
         language='ja',
         author_name="Contrast Security Japan G.K.",
         feed_url='https://contrastsecurity.dev/contrast-documentation-rss/contrast_rlsnote.xml',
diff --git a/work/contrast_rlsnote_eop.py b/work/contrast_rlsnote_eop.py
@@ -0,0 +1,96 @@
+import urllib.request as req 
+from bs4 import BeautifulSoup
+import xml.dom.minidom
+from django.utils.feedgenerator import Rss201rev2Feed
+from datetime import datetime
+import locale
+import re
+import html
+import hashlib
+
+def _parse_pubdate(value):
+    """Parse a ``data-time-modified`` value such as ``November 6, 2023``.
+
+    Returns None when the attribute is missing or not in that format, so
+    a single unexpected value cannot abort the whole feed.
+    """
+    if not value:
+        return None
+    try:
+        return datetime.strptime(value.strip(), '%B %d, %Y')
+    except ValueError:
+        return None
+
+def _build_description(release):
+    """Return the HTML description for one release section.
+
+    Every nested section contributes its heading in bold, followed by one
+    bullet per list item; each piece is wrapped in its own ``<p>``.
+    """
+    parts = []
+    for sub in release.select('section.section'):
+        heading = sub.select_one('div.titlepage')
+        if heading is not None:
+            parts.append('<b>%s</b>' % html.escape(heading.text, quote=False))
+        for item in sub.select('li.listitem'):
+            para = item.select_one('p')
+            # Fall back to the list item itself when it has no <p> child.
+            text = (item if para is None else para).text
+            # The text is embedded in HTML markup, so escape &, < and >.
+            parts.append('・%s' % html.escape(text, quote=False))
+    return ''.join('<p>{0}</p>'.format(part) for part in parts)
+
+def main():
+    """Build the on-premises release note RSS feed and write it to disk.
+
+    Fetches the on-premises release note page, adds one feed item for every
+    section whose id and h3 title both match the release patterns below, and
+    writes the pretty-printed XML to ``/feeds/contrast_rlsnote_eop.xml``.
+    """
+    page_url = 'https://docs.contrastsecurity.jp/ja/release-on-premises.html'
+    # Close the HTTP response as soon as the page has been parsed.
+    with req.urlopen(page_url) as res:
+        soup = BeautifulSoup(res, 'lxml')
+
+    feed = Rss201rev2Feed(
+        title='Contrast Release Note(On-premises)',
+        link='https://contrastsecurity.dev/contrast-documentation-rss',
+        description='Contrast Release Note(On-premises)',
+        language='ja',
+        author_name="Contrast Security Japan G.K.",
+        feed_url='https://contrastsecurity.dev/contrast-documentation-rss/contrast_rlsnote_eop.xml',
+        feed_copyright='Copyright 2023 Contrast Security Japan G.K.'
+    )
+
+    id_ptn = re.compile(r'^[0-9]{1,2}月-[0-9\-]+-$')
+    title_ptn = re.compile(r'^[0-9]{1,2}月\([0-9\.]+\)$')
+
+    for elem in soup.select('section.section'):
+        # Sections without an id or an h3 title are not release entries.
+        id_str = (elem.get('id') or '').strip()
+        title_elem = elem.select_one('h3.title')
+        if title_elem is None:
+            continue
+        title = title_elem.text.strip()
+        if not id_ptn.search(id_str) or not title_ptn.search(title):
+            continue
+        # The guid uses an md5 digest of the id instead of the raw id text.
+        id_hash = hashlib.md5(id_str.encode()).hexdigest()
+        feed.add_item(
+            title=title,
+            link='%s#%s' % (page_url, id_str),
+            description=_build_description(elem),
+            pubdate=_parse_pubdate(elem.get('data-time-modified')),
+            unique_id='%s#%s' % (page_url, id_hash),
+        )
+
+    str_val = feed.writeString('utf-8')
+    dom = xml.dom.minidom.parseString(str_val)
+    # Write UTF-8 explicitly: the XML declaration says utf-8, and the locale
+    # default encoding may be unable to represent the Japanese text.
+    with open('/feeds/contrast_rlsnote_eop.xml', 'w', encoding='utf-8') as fp:
+        dom.writexml(fp, encoding='utf-8', newl='\n', indent='', addindent='    ')
+
+if __name__ == "__main__":
+    main()
+
diff --git a/work/contrast_rlsnote_saas.py b/work/contrast_rlsnote_saas.py
@@ -0,0 +1,96 @@
+import urllib.request as req 
+from bs4 import BeautifulSoup
+import xml.dom.minidom
+from django.utils.feedgenerator import Rss201rev2Feed
+from datetime import datetime
+import locale
+import re
+import html
+import hashlib
+
+def _parse_pubdate(value):
+    """Parse a ``data-time-modified`` value such as ``November 6, 2023``.
+
+    Returns None when the attribute is missing or not in that format, so
+    a single unexpected value cannot abort the whole feed.
+    """
+    if not value:
+        return None
+    try:
+        return datetime.strptime(value.strip(), '%B %d, %Y')
+    except ValueError:
+        return None
+
+def _build_description(release):
+    """Return the HTML description for one release section.
+
+    Every nested section contributes its heading in bold, followed by one
+    bullet per list item; each piece is wrapped in its own ``<p>``.
+    """
+    parts = []
+    for sub in release.select('section.section'):
+        heading = sub.select_one('div.titlepage')
+        if heading is not None:
+            parts.append('<b>%s</b>' % html.escape(heading.text, quote=False))
+        for item in sub.select('li.listitem'):
+            para = item.select_one('p')
+            # Fall back to the list item itself when it has no <p> child.
+            text = (item if para is None else para).text
+            # The text is embedded in HTML markup, so escape &, < and >.
+            parts.append('・%s' % html.escape(text, quote=False))
+    return ''.join('<p>{0}</p>'.format(part) for part in parts)
+
+def main():
+    """Build the SaaS release note RSS feed and write it to disk.
+
+    Fetches the hosted (SaaS) release note page, adds one feed item for every
+    section whose id and h3 title both match the release patterns below, and
+    writes the pretty-printed XML to ``/feeds/contrast_rlsnote_saas.xml``.
+    """
+    page_url = 'https://docs.contrastsecurity.jp/ja/release-hosted.html'
+    # Close the HTTP response as soon as the page has been parsed.
+    with req.urlopen(page_url) as res:
+        soup = BeautifulSoup(res, 'lxml')
+
+    feed = Rss201rev2Feed(
+        title='Contrast Release Note(SaaS)',
+        link='https://contrastsecurity.dev/contrast-documentation-rss',
+        description='Contrast Release Note(SaaS)',
+        language='ja',
+        author_name="Contrast Security Japan G.K.",
+        feed_url='https://contrastsecurity.dev/contrast-documentation-rss/contrast_rlsnote_saas.xml',
+        feed_copyright='Copyright 2023 Contrast Security Japan G.K.'
+    )
+
+    id_ptn = re.compile(r'^20[0-9]{2}年[0-9]{1,2}月$')
+    title_ptn = re.compile(r'^20[0-9]{2}年[0-9]{1,2}月$')
+
+    for elem in soup.select('section.section'):
+        # Sections without an id or an h3 title are not release entries.
+        id_str = (elem.get('id') or '').strip()
+        title_elem = elem.select_one('h3.title')
+        if title_elem is None:
+            continue
+        title = title_elem.text.strip()
+        if not id_ptn.search(id_str) or not title_ptn.search(title):
+            continue
+        # The guid uses an md5 digest of the id instead of the raw id text.
+        id_hash = hashlib.md5(id_str.encode()).hexdigest()
+        feed.add_item(
+            title=title,
+            link='%s#%s' % (page_url, id_str),
+            description=_build_description(elem),
+            pubdate=_parse_pubdate(elem.get('data-time-modified')),
+            unique_id='%s#%s' % (page_url, id_hash),
+        )
+
+    str_val = feed.writeString('utf-8')
+    dom = xml.dom.minidom.parseString(str_val)
+    # Write UTF-8 explicitly: the XML declaration says utf-8, and the locale
+    # default encoding may be unable to represent the Japanese text.
+    with open('/feeds/contrast_rlsnote_saas.xml', 'w', encoding='utf-8') as fp:
+        dom.writexml(fp, encoding='utf-8', newl='\n', indent='', addindent='    ')
+
+if __name__ == "__main__":
+    main()
+