Skip to content

Commit 3301629

Browse files
committed
.
1 parent 733e52b commit 3301629

File tree

2 files changed

+47
-24
lines changed

2 files changed

+47
-24
lines changed

python/src/pyx/sparql_bots/render.py

Lines changed: 42 additions & 17 deletions
Original file line numberDiff line numberDiff line change
@@ -8,6 +8,20 @@
88
from collections import defaultdict
99
from . import sparql_bot
1010

11+
categoryLabels = {
12+
"Q24905": "فعل",
13+
"Q111029": "جذر",
14+
"Q1084": "اسم",
15+
"Q34698": "صفة",
16+
"Q147276": "اسم علم",
17+
"Q4833830": "حرف جر",
18+
"Q9788": "حرف",
19+
"Q36484": "حرف ربط",
20+
"Q468801": "ضمير شخصي",
21+
"Q63116": "اسم عدد"
22+
}
23+
# ---
24+
1125

1226
def split_data_by_category_list(data):
1327
# ---
@@ -42,7 +56,7 @@ def split_data_by_category_dict(data):
4256
if category not in split_by_category:
4357
split_by_category[category] = {
4458
'category': category,
45-
'categoryLabel': item['categoryLabel'],
59+
'categoryLabel': item.get('categoryLabel') or categoryLabels.get(category, ""),
4660
'members': {}
4761
}
4862
# ---
@@ -125,23 +139,34 @@ def render_duplicate_by_category(limit):
125139
return new, sparql_exec_time
126140

127141

128-
def render_duplicate(limit):
142+
def render_duplicate(limit=0):
129143
# ---
130144
result, sparql_exec_time, err = sparql_bot.find_duplicates()
131-
# # ---
145+
# ---
132146
# result = {x['item']: x for x in result}
133-
# # ---
147+
# ---
134148
# split_by_category = split_data_by_category_dict(result)
135-
# # ---
136-
# new = {}
137-
# # ---
138-
# for cat, tab in split_by_category.items():
139-
# # ---
140-
# members = duplicates_work(tab["members"])
141-
# # ---
142-
# if members:
143-
# tab["lemmas"] = members
144-
# # ---
145-
# new[cat] = tab
146-
# # ---
147-
return result, sparql_exec_time
149+
# ---
150+
new = {}
151+
# ---
152+
# { "lemma_fixed": "تذكير", "category": "Q1084", "items": "L1457168, L1457168", "lemmas": "تذكير, تَذْكِير" }
153+
for tab in result:
154+
# ---
155+
new.setdefault(tab['lemma_fixed'], {
156+
"lemma": tab['lemma_fixed'],
157+
"category": tab['category'],
158+
"categoryLabel": categoryLabels.get(tab['category'], ""),
159+
'members' : []
160+
})
161+
# ---
162+
lemmas = tab['lemmas'].split(",")
163+
items = tab['items'].split(",")
164+
# ---
165+
for lemma, item in zip(lemmas, items):
166+
# ---
167+
new[tab['lemma_fixed']]['members'].append({
168+
"lemma": lemma.strip(),
169+
"item": item.strip(),
170+
})
171+
# ---
172+
return new, sparql_exec_time

python/src/templates/duplicate2.html

Lines changed: 5 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -28,22 +28,21 @@ <h2 class="mb-4" id="header_main">
2828
</tr>
2929
</thead>
3030
<tbody id="table_body">
31-
{%for category, data in result.items() %}
32-
{% for lemma, members in data.lemmas.items() %}
31+
{% for lemma, tab in result.items() %}
3332
<tr>
3433
<td>{{loop.index}}</td>
3534
<td>{{lemma}}</td>
3635
<td>
37-
<a href="https://www.wikidata.org/entity/{{ data.category }}"
38-
target="_blank">{{ data.categoryLabel }}</a>
36+
<a href="https://www.wikidata.org/entity/{{ tab.category }}"
37+
target="_blank">{{ tab.categoryLabel }}</a>
3938
</td>
4039
<td>
41-
{{ members|length }}
40+
{{ tab.members|length }}
4241
</td>
4342
<td>
4443
<div class="w-100">
4544
<div class="list-group list-group-horizontal">
46-
{%for item in members %}
45+
{%for item in tab.members %}
4746
<div class="list-group-item m-1">
4847
<a href="https://www.wikidata.org/entity/{{item.item}}" target="_blank">
4948
<span class="fs-2">
@@ -63,7 +62,6 @@ <h2 class="mb-4" id="header_main">
6362
</td>
6463
</tr>
6564
{%endfor%}
66-
{%endfor%}
6765
</tbody>
6866
</table>
6967
</div>

0 commit comments

Comments
 (0)