From 776dc0cfb3273dc575adddf04f14d0a83cb7cb7e Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?O=C4=9Fuz=20Akif=20T=C3=BCfekcio=C4=9Flu?= Date: Thu, 6 Oct 2022 23:07:20 +0300 Subject: [PATCH 1/7] Datasets, models and summary added to text-to-image task --- tasks/src/text-to-image/about.md | 0 tasks/src/text-to-image/data.ts | 34 ++++++++++++++++++++++++++++++++ 2 files changed, 34 insertions(+) create mode 100644 tasks/src/text-to-image/about.md create mode 100644 tasks/src/text-to-image/data.ts diff --git a/tasks/src/text-to-image/about.md b/tasks/src/text-to-image/about.md new file mode 100644 index 000000000..e69de29bb diff --git a/tasks/src/text-to-image/data.ts b/tasks/src/text-to-image/data.ts new file mode 100644 index 000000000..24d1b1426 --- /dev/null +++ b/tasks/src/text-to-image/data.ts @@ -0,0 +1,34 @@ +import type { TaskDataCustom } from "../Types"; + +const taskData: TaskDataCustom = { + datasets: [ + { + description: "Dataset used to train Pokémon text to image model.", + id: "lambdalabs/pokemon-blip-captions", + }, + { + description: "A dataset that contains more than 30K images with their corresponding text from the Shahnameh.", + id: "sadrasabouri/ShahNegar", + }, + ], + demo: { + inputs: [], + outputs: [], + }, + metrics: [], + models: [ + { + description: "A latent text-to-image diffusion model capable of generating photo-realistic images given any text input.", + id: "CompVis/stable-diffusion-v1-4", + }, + { + description: "A latent text-to-image diffusion model that has been conditioned on high-quality anime images through fine-tuning.", + id: "hakurei/waifu-diffusion", + }, + ], + summary: "Generating image from input text. These models that can be used to generate and modify images based on text prompts.", + widgetModels: [], + youtubeId: "", +}; + +export default taskData; From c47de8ef997e1d7565c7923b1cce76568d7d39f6 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?O=C4=9Fuz=20Akif=20T=C3=BCfekcio=C4=9Flu?= Date: Fri, 7 Oct 2022 17:13:47 +0300 Subject: [PATCH 2/7] General purpose model and general purpose datasets are added --- tasks/src/text-to-image/data.ts | 16 ++++++++-------- 1 file changed, 8 insertions(+), 8 deletions(-) diff --git a/tasks/src/text-to-image/data.ts b/tasks/src/text-to-image/data.ts index 24d1b1426..635062897 100644 --- a/tasks/src/text-to-image/data.ts +++ b/tasks/src/text-to-image/data.ts @@ -3,12 +3,12 @@ import type { TaskDataCustom } from "../Types"; const taskData: TaskDataCustom = { datasets: [ { - description: "Dataset used to train Pokémon text to image model.", - id: "lambdalabs/pokemon-blip-captions", + description: "A large-scale image dataset containing images of everyday objects and people with their textual descriptions.", + id: "ChristophSchuhmann/MS_COCO_2017_URL_TEXT", }, { - description: "A dataset that contains more than 30K images with their corresponding text from the Shahnameh.", - id: "sadrasabouri/ShahNegar", + description: "A dataset created from Midjourney User Prompts & Generated Images", + id: "nateraw/midjourney-texttoimage-new", }, ], demo: { @@ -18,12 +18,12 @@ const taskData: TaskDataCustom = { metrics: [], models: [ { - description: "A latent text-to-image diffusion model capable of generating photo-realistic images given any text input.", - id: "CompVis/stable-diffusion-v1-4", + description: "A model that can be used to generate images based on text prompts. The DALL·E Mega model is the largest version of DALLE Mini.", + id: "dalle-mini/dalle-mega", }, { - description: "A latent text-to-image diffusion model that has been conditioned on high-quality anime images through fine-tuning.", - id: "hakurei/waifu-diffusion", + description: "A latent text-to-image diffusion model capable of generating photo-realistic images given any text input.", + id: "CompVis/stable-diffusion-v1-4", }, ], summary: "Generating image from input text. These models that can be used to generate and modify images based on text prompts.", From 51ec3542cd44a8d66c694c03582fe1649e31030b Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?O=C4=9Fuz=20Akif=20T=C3=BCfekcio=C4=9Flu?= Date: Mon, 10 Oct 2022 17:14:51 +0300 Subject: [PATCH 3/7] indent errors are fixed --- tasks/src/text-to-image/data.ts | 26 +++++++++++++------------- 1 file changed, 13 insertions(+), 13 deletions(-) diff --git a/tasks/src/text-to-image/data.ts b/tasks/src/text-to-image/data.ts index 635062897..8bd4e0de4 100644 --- a/tasks/src/text-to-image/data.ts +++ b/tasks/src/text-to-image/data.ts @@ -1,34 +1,34 @@ import type { TaskDataCustom } from "../Types"; const taskData: TaskDataCustom = { - datasets: [ + datasets: [ { description: "A large-scale image dataset containing images of everyday objects and people with their textual descriptions.", - id: "ChristophSchuhmann/MS_COCO_2017_URL_TEXT", + id: "ChristophSchuhmann/MS_COCO_2017_URL_TEXT", }, { description: "A dataset created from Midjourney User Prompts & Generated Images", - id: "nateraw/midjourney-texttoimage-new", + id: "nateraw/midjourney-texttoimage-new", }, ], - demo: { - inputs: [], - outputs: [], - }, - metrics: [], - models: [ + demo: { + inputs: [], + outputs: [], + }, + metrics: [], + models: [ { description: "A model that can be used to generate images based on text prompts. The DALL·E Mega model is the largest version of DALLE Mini.", - id: "dalle-mini/dalle-mega", + id: "dalle-mini/dalle-mega", }, { description: "A latent text-to-image diffusion model capable of generating photo-realistic images given any text input.", - id: "CompVis/stable-diffusion-v1-4", + id: "CompVis/stable-diffusion-v1-4", }, ], - summary: "Generating image from input text. These models that can be used to generate and modify images based on text prompts.", + summary: "Generating image from input text. These models that can be used to generate and modify images based on text prompts.", widgetModels: [], - youtubeId: "", + youtubeId: "", }; export default taskData; From 2bb51ad93d408264982a0027c63c23f9425e8df1 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?O=C4=9Fuz=20Akif=20T=C3=BCfekcio=C4=9Flu?= Date: Mon, 10 Oct 2022 17:20:20 +0300 Subject: [PATCH 4/7] Extra space removed for demo attribute --- tasks/src/text-to-image/data.ts | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/tasks/src/text-to-image/data.ts b/tasks/src/text-to-image/data.ts index 8bd4e0de4..7ea091985 100644 --- a/tasks/src/text-to-image/data.ts +++ b/tasks/src/text-to-image/data.ts @@ -12,9 +12,9 @@ const taskData: TaskDataCustom = { }, ], demo: { - inputs: [], - outputs: [], - }, + inputs: [], + outputs: [], + }, metrics: [], models: [ { From a9a17be89bc5e74e8bd822ccdc48c5046bc0dbff Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?O=C4=9Fuz=20Akif=20T=C3=BCfekcio=C4=9Flu?= <61146329+oguzakif@users.noreply.github.com> Date: Mon, 10 Oct 2022 22:33:37 +0300 Subject: [PATCH 5/7] Update tasks/src/text-to-image/data.ts Co-authored-by: Omar Sanseviero --- tasks/src/text-to-image/data.ts | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tasks/src/text-to-image/data.ts b/tasks/src/text-to-image/data.ts index 7ea091985..7da828a69 100644 --- a/tasks/src/text-to-image/data.ts +++ b/tasks/src/text-to-image/data.ts @@ -26,7 +26,7 @@ const taskData: TaskDataCustom = { id: "CompVis/stable-diffusion-v1-4", }, ], - summary: "Generating image from input text. These models that can be used to generate and modify images based on text prompts.", + summary: "Generates images from input text. These models can be used to generate and modify images based on text prompts.", widgetModels: [], youtubeId: "", }; From ec6b924c00d0a017e727356c9d28c8d2c11b9f8e Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?O=C4=9Fuz=20Akif=20T=C3=BCfekcio=C4=9Flu?= Date: Tue, 11 Oct 2022 23:01:07 +0300 Subject: [PATCH 6/7] Datasets are changed with more usable ones --- tasks/src/text-to-image/data.ts | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/tasks/src/text-to-image/data.ts b/tasks/src/text-to-image/data.ts index 7da828a69..7c5316e41 100644 --- a/tasks/src/text-to-image/data.ts +++ b/tasks/src/text-to-image/data.ts @@ -3,12 +3,12 @@ import type { TaskDataCustom } from "../Types"; const taskData: TaskDataCustom = { datasets: [ { - description: "A large-scale image dataset containing images of everyday objects and people with their textual descriptions.", - id: "ChristophSchuhmann/MS_COCO_2017_URL_TEXT", + description: "RedCaps is a large-scale dataset of 12M image-text pairs collected from Reddit.", + id: "red_caps", }, { - description: "A dataset created from Midjourney User Prompts & Generated Images", - id: "nateraw/midjourney-texttoimage-new", + description: "Conceptual Captions is a dataset consisting of ~3.3M images annotated with captions.", + id: "conceptual_captions", }, ], demo: { From 50238f4fd97d04eb2c96663093e8904ca20a5801 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?O=C4=9Fuz=20Akif=20T=C3=BCfekcio=C4=9Flu?= Date: Wed, 12 Oct 2022 22:19:20 +0300 Subject: [PATCH 7/7] Fixed indent and key-value spaces --- tasks/src/text-to-image/about.md | 0 tasks/src/text-to-image/data.ts | 10 +++++----- 2 files changed, 5 insertions(+), 5 deletions(-) delete mode 100644 tasks/src/text-to-image/about.md diff --git a/tasks/src/text-to-image/about.md b/tasks/src/text-to-image/about.md deleted file mode 100644 index e69de29bb..000000000 diff --git a/tasks/src/text-to-image/data.ts b/tasks/src/text-to-image/data.ts index 7c5316e41..2798a38a4 100644 --- a/tasks/src/text-to-image/data.ts +++ b/tasks/src/text-to-image/data.ts @@ -1,7 +1,7 @@ import type { TaskDataCustom } from "../Types"; const taskData: TaskDataCustom = { - datasets: [ + datasets: [ { description: "RedCaps is a large-scale dataset of 12M image-text pairs collected from Reddit.", id: "red_caps", @@ -11,12 +11,12 @@ const taskData: TaskDataCustom = { id: "conceptual_captions", }, ], - demo: { - inputs: [], + demo: { + inputs: [], outputs: [], }, - metrics: [], - models: [ + metrics: [], + models: [ { description: "A model that can be used to generate images based on text prompts. The DALL·E Mega model is the largest version of DALLE Mini.", id: "dalle-mini/dalle-mega",