ubitux
diff --git a/‎.gitignore‎
Lines changed: 2 additions & 0 deletions b/‎.gitignore‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎.screenshot.png‎
696 KB b/‎.screenshot.png‎
696 KB
diff --git a/‎LICENSE‎
Lines changed: 674 additions & 0 deletions b/‎LICENSE‎
Lines changed: 674 additions & 0 deletions
diff --git a/‎README.md‎
Lines changed: 60 additions & 0 deletions b/‎README.md‎
Lines changed: 60 additions & 0 deletions
diff --git a/‎pyproject.toml‎
Lines changed: 40 additions & 0 deletions b/‎pyproject.toml‎
Lines changed: 40 additions & 0 deletions
diff --git a/‎snapstudysensei/__init__.py‎
Lines changed: 31 additions & 0 deletions b/‎snapstudysensei/__init__.py‎
Lines changed: 31 additions & 0 deletions
diff --git a/‎snapstudysensei/anki.py‎
Lines changed: 174 additions & 0 deletions b/‎snapstudysensei/anki.py‎
Lines changed: 174 additions & 0 deletions
diff --git a/‎snapstudysensei/data/back.html‎
Lines changed: 9 additions & 0 deletions b/‎snapstudysensei/data/back.html‎
Lines changed: 9 additions & 0 deletions
diff --git a/‎snapstudysensei/data/front.html‎
Lines changed: 2 additions & 0 deletions b/‎snapstudysensei/data/front.html‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎snapstudysensei/data/style.css‎
Lines changed: 11 additions & 0 deletions b/‎snapstudysensei/data/style.css‎
Lines changed: 11 additions & 0 deletions
@@ -0,0 +1,2 @@
+SnapStudySensei.egg-info
+venv
@@ -0,0 +1,60 @@
+# SnapStudySensei
+
+**SnapStudySensei** is a tool to assist with capturing, extracting, translating
+and recording Japanese flashcards into [Anki].
+
+This project is inspired by [Game2Text] but takes a different technical approach.
+
+![SnapStudySensei screenshot](.screenshot.png)
+
+
+## Known limitations
+
+- Currently **only supported on Linux**. Porting it to macOS and Windows should
+  be doable by adding the ability to list windows on those platforms (see
+  `windows_list.py`; patches welcome).
+- **No configuration**: it is only designed around my own needs so far
+- A bit **slow to start** due to the OCR model initialization
+
+
+## Installation
+
+[Anki] and its [Anki-Connect] plugin must be installed.
+
+```sh
+python -m venv venv
+. venv/bin/activate
+pip install -e .
+```
+
+### Important note
+
+This is a non-intrusive standalone installation, but system input methods (such
+as fcitx) are unlikely to work because of how PySide6 is isolated inside a
+virtual env. Installing it system-wide is the only workaround I could find
+so far.
+
+
+## Running
+
+[Anki] and its [Anki-Connect] plugin must be running.
+
+Enter the venv (`. venv/bin/activate`) if you used that installation method, and
+run `sss`.
+
+### Important note
+
+SnapStudySensei will automatically create a model, a deck and flashcard templates
+in Anki. The deck is called *SnapStudySensei* and is nested under the *Japanese*
+parent deck (`Japanese::SnapStudySensei`).
+
+
+## Thanks to
+
+- [Manga OCR](https://github.com/kha-white/manga-ocr/)
+- [JMdict](https://www.edrdg.org/wiki/index.php/JMdict-EDICT_Dictionary_Project)
+
+
+[Anki]: https://apps.ankiweb.net
+[Anki-Connect]: https://foosoft.net/projects/anki-connect
+[Game2Text]: https://game2text.com
@@ -0,0 +1,40 @@
+[project]
+name = "SnapStudySensei"
+version = "0.0.1"
+authors = [
+  { name="Clément Bœsch", email="u@pkh.me" },
+]
+description = "Capture, extract, translate and record Japanese flashcards into Anki"
+readme = "README.md"
+requires-python = ">=3.10"  # anki.py evaluates `Path | None` annotations at import time (PEP 604)
+classifiers = [
+    "Programming Language :: Python :: 3",
+    "License :: OSI Approved :: GNU General Public License v3 (GPLv3)",
+    "Natural Language :: Japanese",
+]
+dependencies = [
+  'PySide6',
+  'pillow',
+  'xdg-base-dirs',
+  'manga-ocr',
+  'xcffib',
+  'gtts',
+]
+
+[project.urls]
+"Homepage" = "https://github.com/ubitux/SnapStudySensei"
+"Bug Tracker" = "https://github.com/ubitux/SnapStudySensei/issues"
+
+[project.gui-scripts]
+sss = "snapstudysensei:run"  # the `sss` command calls run() from the snapstudysensei package
+
+[tool.black]
+line-length = 120
+
+[tool.isort]
+profile = "black"
+line_length = 120
+
+[tool.pyright]
+venv = "venv"
+venvPath = "."
@@ -0,0 +1,31 @@
+def _init_ocr():
+    """Print a progress line, then import the OCR module and return a new OCRWrapper."""
+    print(":: initializing Optical Character Recognition")
+    from snapstudysensei.ocr import OCRWrapper  # imported only after the message is shown
+    return OCRWrapper()
+
+
+def _init_dic():
+    """Print a progress line, then import the dictionary module and return a new JDictionary."""
+    print(":: initializing dictionary")
+    from snapstudysensei.dic import JDictionary  # imported only after the message is shown
+    return JDictionary()
+
+
+def _init_tts():
+    """Print a progress line, then import the TTS module and return a new TTSWrapper."""
+    print(":: initializing Text-To-Speech")
+    from snapstudysensei.tts import TTSWrapper  # imported only after the message is shown
+    return TTSWrapper()
+
+
+def run():
+    """Start the application: build the OCR, dictionary and TTS helpers, then pass them to main.run."""
+    # These steps could be slow; a dedicated loading UI or splashscreen
+    # shown while they complete might make sense
+    helpers = (_init_ocr(), _init_dic(), _init_tts())  # built left to right: OCR, dictionary, TTS
+
+    # The main module is imported only after the helpers have been built
+    from snapstudysensei.main import run as launch
+
+    launch(*helpers)
@@ -0,0 +1,174 @@
+import base64
+import hashlib
+import json
+import re
+from dataclasses import asdict, dataclass
+from pathlib import Path
+from urllib.request import Request, urlopen
+
+
+@dataclass
+class AnkiNote:
+    """One vocabulary flashcard, as sent to Anki and as read back from it."""
+
+    word: str
+    context_picture: Path | None  # path of the file attached to the ContextPicture field, if any
+    context_sentence: str
+    word_reading: str
+    word_glossary: str
+    word_audio: Path | None = None
+    extra_info: str = ""
+    anki_id: int = -1  # -1 is the placeholder used until a note id is assigned
+
+    def get_qml_record(self):
+        """Return the record_id/reading/meaning dict for this note; anki_id must not be -1."""
+        assert self.anki_id != -1
+        # QML doesn't support 64-bit integers (javascript bs), hence the id is sent as a string
+        shown = self.word_reading.translate(str.maketrans("[]", "「」")) if self.word_reading else self.word
+        return {"record_id": str(self.anki_id), "reading": shown, "meaning": self.word_glossary}
+
+
+class AnkiConnect:
+    """Small Anki-Connect client bound to the SnapStudySensei deck and note model."""
+
+    PREFIX = "SnapStudySensei"
+    DECK_NAME = f"Japanese::{PREFIX}"
+    MODEL_NAME = f"{PREFIX} Word"
+
+    def __init__(self):
+        """Create the deck and the note model in Anki when missing, then fetch the media directory path."""
+        if self.query("deckNamesAndIds").get(self.DECK_NAME) is None:
+            self.query("createDeck", deck=self.DECK_NAME)
+
+        if self.query("modelNamesAndIds").get(self.MODEL_NAME) is None:
+            # read_text() closes each template file, unlike a bare open().read()
+            tpl_dir = Path(__file__).resolve().parent / "data"
+            names = ("front.html", "back.html", "style.css")
+            front, back, css = ((tpl_dir / name).read_text(encoding="utf-8") for name in names)
+            self.query(
+                "createModel",
+                modelName=self.MODEL_NAME,
+                inOrderFields=[
+                    "Word",
+                    "ContextPicture",
+                    "ContextSentence",
+                    "WordReading",
+                    "WordGlossary",
+                    "WordAudio",
+                    "ExtraInfo",
+                ],
+                css=css,
+                cardTemplates=[dict(Front=front, Back=back)],
+            )
+
+        self.media_dir_path = Path(self.query("getMediaDirPath"))
+
+    def add_note(self, note: AnkiNote) -> AnkiNote:
+        """Add `note` to Anki; return a copy (input untouched) carrying its Anki id and ruby reading."""
+        # Craft a ruby string for Anki furigana text on the back side
+        reading = note.word
+        if note.word_reading and note.word_reading != note.word:
+            reading += f"[{note.word_reading}]"
+
+        params = dict(
+            deckName=self.DECK_NAME,
+            modelName=self.MODEL_NAME,
+            fields=dict(
+                Word=note.word,
+                ContextSentence=note.context_sentence,
+                WordReading=reading,
+                WordGlossary=note.word_glossary,
+                ExtraInfo=note.extra_info,
+            ),
+            options=dict(allowDuplicate=True),
+            tags=[self.PREFIX],
+        )
+
+        # _get_file() reads each media file itself, so no extra open() is needed here
+        if note.context_picture:
+            filename, data_base64 = self._get_file(note.context_picture)
+            params["picture"] = [dict(filename=filename, data=data_base64, fields=["ContextPicture"])]
+        if note.word_audio:
+            filename, data_base64 = self._get_file(note.word_audio)
+            params["audio"] = [dict(filename=filename, data=data_base64, fields=["WordAudio"])]
+
+        patched_note = AnkiNote(**asdict(note))
+        patched_note.word_reading = reading
+        patched_note.anki_id = self.query("addNote", note=params)
+        return patched_note
+
+    def _get_file(self, filepath: Path) -> tuple[str, str]:
+        """Return (media filename, base64-encoded content) for the file at `filepath`.
+
+        The filename is built from PREFIX, the SHA-256 hex digest of the content and the original suffix.
+        """
+        content = filepath.read_bytes()
+        digest = hashlib.sha256(content).hexdigest()
+
+        # Anki might be a sandboxed app where access to the filesystem is
+        # restricted (typical usecase: a flatpak), so we use a base64 encode
+        # instead of a file path.
+        data_base64 = base64.b64encode(content).decode("utf-8")
+
+        return f"{self.PREFIX}_{digest}{filepath.suffix}", data_base64
+
+    def list_notes(self) -> list[AnkiNote]:
+        """Return every note found in the deck as an AnkiNote (media paths under the media directory)."""
+        note_ids = self.query("findNotes", query=f"deck:{self.DECK_NAME}")
+        notes_info = self.query("notesInfo", notes=note_ids)
+
+        notes = []
+        for note_info in notes_info:
+            fields = note_info["fields"]
+
+            # The picture field holds HTML: take the file name from its src attribute
+            picture_html = fields["ContextPicture"]["value"]
+            match = re.search(r'src="(?P<filename>[^"]+)"', picture_html)
+            picture_path = self.media_dir_path / match["filename"] if match is not None else None
+
+            # The audio field holds a [sound:...] marker naming the file
+            audio_markup = fields["WordAudio"]["value"]
+            match = re.search(r"\[sound:(?P<filename>[^\]]+)\]", audio_markup)
+            audio_path = self.media_dir_path / match["filename"] if match is not None else None
+
+            notes.append(
+                AnkiNote(
+                    word=fields["Word"]["value"],
+                    context_picture=picture_path,
+                    context_sentence=fields["ContextSentence"]["value"],
+                    word_reading=fields["WordReading"]["value"],
+                    word_glossary=fields["WordGlossary"]["value"],
+                    word_audio=audio_path,
+                    extra_info=fields["ExtraInfo"]["value"],
+                    anki_id=note_info["noteId"],
+                )
+            )
+
+        return notes
+
+    def remove_note(self, anki_id: int):
+        """Delete the note identified by `anki_id` from Anki."""
+        self.query("deleteNotes", notes=[anki_id])
+
+    @staticmethod
+    def query(action, **params):
+        """POST an Anki-Connect request (version 6); return its result, raise Exception on error/bad reply."""
+        request_data = dict(action=action, params=params, version=6)
+        request_json = json.dumps(request_data).encode("utf-8")
+        # The context manager closes the HTTP response once it has been parsed
+        with urlopen(Request("http://localhost:8765", request_json)) as http_response:
+            response = json.load(http_response)
+        if len(response) != 2:
+            raise Exception("response has an unexpected number of fields")
+        if "error" not in response:
+            raise Exception("response is missing required error field")
+        if "result" not in response:
+            raise Exception("response is missing required result field")
+        if response["error"] is not None:
+            raise Exception(response["error"])
+        return response["result"]
+
+
+if __name__ == "__main__":
+    # Manual smoke test: connect through Anki-Connect and print the notes of the deck
+    print(AnkiConnect().list_notes())
@@ -0,0 +1,9 @@
+<h1>{{furigana:WordReading}}</h1>
+
+<hr>
+
+<pre>{{WordGlossary}}</pre>
+<p>{{ExtraInfo}}</p>
+<p>{{ContextSentence}}</p>
+<p>{{WordAudio}}</p>
+<p>{{ContextPicture}}</p>
@@ -0,0 +1,2 @@
+<h1>{{Word}}</h1>
+<p>{{hint:ContextSentence}}</p>
@@ -0,0 +1,11 @@
+.card {
+    font-family: sans-serif;
+    font-size: 1.5em;
+    text-align: center;
+    color: white;
+    background-color: #222222;
+    margin-left: auto;
+    margin-right: auto;
+}
+
+pre { text-align: center; }
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,2 @@`
	`1`	`+<h1>{{Word}}</h1>`
	`2`	`+<p>{{hint:ContextSentence}}</p>`