We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 757042f commit 01d4c91 (Copy full SHA for 01d4c91)
training/text_classification.py
@@ -18,6 +18,9 @@ def main():
18
- stop_words="english"
19
- min_df=5
20
"""
21
+ # data.csv is available in the RNA Resources -> RNAcentral -> RNAcentral References folder on Google Drive.
22
+ # articles up to line 6295 were extracted using the export_data.py script. The last 400 articles were
23
+ # manually reviewed by the team.
24
df = pd.read_csv("data.csv")
25
print(df["rna_related"].value_counts(), "\n")
26
# rna_related
0 commit comments