Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
62 changes: 26 additions & 36 deletions CITATION.cff
Original file line number Diff line number Diff line change
@@ -1,50 +1,40 @@
cff-version: "1.2.0"
title: "PyThaiNLP: Thai Natural Language Processing in Python"
message: >-
If you use this software, please cite it using these
metadata.
type: software
cff-version: 1.2.0
message: "If you use this software, please cite it as below."
title: PyThaiNLP
authors:
- family-names: Phatthiyaphaibun
given-names: Wannaphong
orcid: "https://orcid.org/0000-0002-4153-4354"
orcid: https://orcid.org/0000-0002-4153-4354
- family-names: Chaovavanich
given-names: Korakot
orcid: "https://orcid.org/0009-0002-7350-9855"
orcid: https://orcid.org/0009-0002-7350-9855
- family-names: Polpanumas
given-names: Charin
orcid: "https://orcid.org/0000-0001-7822-4600"
orcid: https://orcid.org/0000-0001-7822-4600
- family-names: Suriyawongkul
given-names: Arthit
orcid: "https://orcid.org/0000-0002-9698-1899"
orcid: https://orcid.org/0000-0002-9698-1899
- family-names: Lowphansirikul
given-names: Lalita
orcid: "https://orcid.org/0000-0002-5305-2088"
orcid: https://orcid.org/0000-0002-5305-2088
- family-names: Chormai
given-names: Pattarawat
orcid: "https://orcid.org/0000-0002-7582-4667"
identifiers:
- type: doi
value: 10.5281/zenodo.3519354
description: >-
This is the collection of archived snapshots of all
versions of PyThaiNLP.
repository-code: "https://github.com/PyThaiNLP/pythainlp/"
repository: "https://github.com/PyThaiNLP/pythainlp/"
url: "https://pythainlp.org/"
abstract: "Thai natural language processing in Python"
keywords:
- "natural language processing"
- "Thai"
- "Python"
- "text processing"
- "computational linguistics"
- "tokenization"
- "localization"
- "word segmentation"
- "NLP"
- "Thai language"
- "Thai NLP"
license: Apache-2.0
orcid: https://orcid.org/0000-0002-7582-4667
abstract: PyThaiNLP is a Thai natural language processing library for Python. It provides standard linguistic analysis for the Thai language, including tokenization and part-of-speech tagging. Additionally, it offers standard Thai locale utility functions, such as Thai Buddhist Era date formatting and the conversion of numbers into Thai text.
repository-code: "https://github.com/PyThaiNLP/pythainlp"
type: software
version: 5.2.0
date-released: "2025-12-20"
license-url: "https://spdx.org/licenses/Apache-2.0"
keywords:
- computational linguistics
- linguistics
- localization
- natural language processing
- NLP
- text analysis
- text processing
- ThaiNLP
- Thai NLP
- Thai language
- tokenization
date-released: 2025-12-20
94 changes: 48 additions & 46 deletions codemeta.json
Original file line number Diff line number Diff line change
@@ -1,45 +1,45 @@
{
"@context": "https://w3id.org/codemeta/3.0",
"type": "SoftwareSourceCode",
"@type": "SoftwareSourceCode",
"applicationCategory": "text analysis",
"author": [
{
"id": "https://orcid.org/0000-0002-4153-4354",
"type": "Person",
"@id": "https://orcid.org/0000-0002-4153-4354",
"@type": "Person",
"familyName": "Phatthiyaphaibun",
"givenName": "Wannaphong"
},
{
"id": "https://orcid.org/0009-0002-7350-9855",
"type": "Person",
"@id": "https://orcid.org/0009-0002-7350-9855",
"@type": "Person",
"familyName": "Chaovavanich",
"givenName": "Korakot"
},
{
"id": "https://orcid.org/0000-0001-7822-4600",
"type": "Person",
"@id": "https://orcid.org/0000-0001-7822-4600",
"@type": "Person",
"familyName": "Polpanumas",
"givenName": "Charin"
},
{
"id": "https://orcid.org/0000-0002-9698-1899",
"type": "Person",
"@id": "https://orcid.org/0000-0002-9698-1899",
"@type": "Person",
"affiliation": {
"type": "Organization",
"@type": "Organization",
"name": "ADAPT Centre, Trinity College Dublin"
},
"familyName": "Suriyawongkul",
"givenName": "Arthit"
},
{
"id": "https://orcid.org/0000-0002-5305-2088",
"type": "Person",
"@id": "https://orcid.org/0000-0002-5305-2088",
"@type": "Person",
"familyName": "Lowphansirikul",
"givenName": "Lalita"
},
{
"id": "https://orcid.org/0000-0002-7582-4667",
"type": "Person",
"@id": "https://orcid.org/0000-0002-7582-4667",
"@type": "Person",
"familyName": "Chormai",
"givenName": "Pattarawat"
}
Expand All @@ -53,6 +53,7 @@
"developmentStatus": "active",
"downloadUrl": "https://github.com/PyThaiNLP/pythainlp/releases",
"identifier": "10.5281/zenodo.3519354",
"isAccessibleForFree": true,
"issueTracker": "https://github.com/PyThaiNLP/pythainlp/issues",
"keywords": [
"computational linguistics",
Expand All @@ -70,16 +71,16 @@
"license": "https://spdx.org/licenses/Apache-2.0",
"maintainer": [
{
"id": "https://orcid.org/0000-0002-4153-4354",
"type": "Person",
"@id": "https://orcid.org/0000-0002-4153-4354",
"@type": "Person",
"familyName": "Phatthiyaphaibun",
"givenName": "Wannaphong"
},
{
"id": "https://orcid.org/0000-0002-9698-1899",
"type": "Person",
"@id": "https://orcid.org/0000-0002-9698-1899",
"@type": "Person",
"affiliation": {
"type": "Organization",
"@type": "Organization",
"name": "ADAPT Centre, Trinity College Dublin"
},
"familyName": "Suriyawongkul",
Expand All @@ -91,101 +92,102 @@
"readme": "https://github.com/PyThaiNLP/pythainlp/blob/dev/README.md",
"referencePublication": [
{
"type": "ScholarlyArticle",
"@type": "ScholarlyArticle",
"author": [
{
"id": "https://orcid.org/0000-0002-4153-4354",
"type": "Person",
"@id": "https://orcid.org/0000-0002-4153-4354",
"@type": "Person",
"affiliation": {
"name": "VISTEC",
"type": "Organization"
"@type": "Organization"
},
"email": "wannaphong.p_s21@vistec.ac.th",
"familyName": "Phatthiyaphaibun",
"givenName": "Wannaphong"
},
{
"id": "https://orcid.org/0009-0002-7350-9855",
"type": "Person",
"@id": "https://orcid.org/0009-0002-7350-9855",
"@type": "Person",
"affiliation": {
"name": "PyThaiNLP",
"type": "Organization"
"@type": "Organization"
},
"familyName": "Chaovavanich",
"givenName": "Korakot"
},
{
"id": "https://orcid.org/0000-0001-7822-4600",
"type": "Person",
"@id": "https://orcid.org/0000-0001-7822-4600",
"@type": "Person",
"affiliation": {
"name": "PyThaiNLP",
"type": "Organization"
"@type": "Organization"
},
"familyName": "Polpanumas",
"givenName": "Charin"
},
{
"id": "https://orcid.org/0000-0002-9698-1899",
"type": "Person",
"@id": "https://orcid.org/0000-0002-9698-1899",
"@type": "Person",
"affiliation": {
"name": "Trinity College Dublin",
"type": "Organization"
"@type": "Organization"
},
"familyName": "Suriyawongkul",
"givenName": "Arthit"
},
{
"id": "https://orcid.org/0000-0002-5305-2088",
"type": "Person",
"@id": "https://orcid.org/0000-0002-5305-2088",
"@type": "Person",
"affiliation": {
"name": "VISTEC",
"type": "Organization"
"@type": "Organization"
},
"familyName": "Lowphansirikul",
"givenName": "Lalita"
},
{
"id": "https://orcid.org/0000-0002-7582-4667",
"type": "Person",
"@id": "https://orcid.org/0000-0002-7582-4667",
"@type": "Person",
"affiliation": {
"name": "Technische Universität Berlin; Max Planck School of Cognition",
"type": "Organization"
"@type": "Organization"
},
"familyName": "Chormai",
"givenName": "Pattarawat"
},
{
"id": "https://orcid.org/0000-0002-7212-8228",
"type": "Person",
"@id": "https://orcid.org/0000-0002-7212-8228",
"@type": "Person",
"affiliation": {
"name": "VISTEC",
"type": "Organization"
"@type": "Organization"
},
"familyName": "Limkonchotiwat",
"givenName": "Peerat"
},
{
"type": "Person",
"@type": "Person",
"affiliation": {
"name": "Wisesight",
"type": "Organization"
"@type": "Organization"
},
"familyName": "Suntorntip",
"givenName": "Thanathip"
},
{
"id": "https://orcid.org/0000-0002-7090-0536",
"type": "Person",
"@id": "https://orcid.org/0000-0002-7090-0536",
"@type": "Person",
"affiliation": {
"name": "VISTEC",
"type": "Organization"
"@type": "Organization"
},
"familyName": "Udomcharoenchaikit",
"givenName": "Can"
}
],
"datePublished": "2023-12-06",
"identifier": "10.18653/v1/2023.nlposs-1.4",
"isAccessibleForFree": true,
"name": "PyThaiNLP: Thai Natural Language Processing in Python",
"url": "https://aclanthology.org/2023.nlposs-1.4/"
}
Expand Down