|
1 | 1 | {
|
2 | 2 | "title": "Sentence Embeddings with transformers.js and umap",
|
3 |
| - "description": "In this video, I cover the node.js \"dotenv\" package and show how to save API credentials as environment variables. ", |
4 |
| - "videoNumber": "4.3", |
| 3 | + "description": "In the livestream, I demonstrate how to visualize sentence embeddings with transformers.js and umap", |
| 4 | + "videoNumber": "", |
5 | 5 | "videoId": "1mwguqeEz8c",
|
6 | 6 | "date": "2023-12-04",
|
7 | 7 | "languages": ["Transformers.js"],
|
8 |
| - "topics": ["transformers", "embeddings"], |
| 8 | + "topics": ["transformers", "embeddings", "retrieval augmented generation", "umap"], |
9 | 9 | "canContribute": false,
|
10 | 10 | "timestamps": [
|
11 | 11 | { "time": "0:00:00", "title": "Livestream starts" },
|
|
14 | 14 | { "time": "0:20:55", "title": "save embeddings.json repo" },
|
15 | 15 | { "time": "0:31:29", "title": "What is an embedding?" },
|
16 | 16 | { "time": "0:38:45", "title": "Feature extraction" },
|
17 |
| - { "time": "0:47:31", "title": "Retrieval augmented Generation" }, |
| 17 | + { "time": "0:47:31", "title": "Retrieval Augmented Generation" }, |
18 | 18 | { "time": "0:57:42", "title": "Transformers.js and ONNX" },
|
19 | 19 | { "time": "0:59:22", "title": "Initialize new node project" },
|
20 | 20 | { "time": "1:02:05", "title": "Pipelines" },
|
21 | 21 | { "time": "1:04:15", "title": "Load model function" },
|
22 | 22 | { "time": "1:08:03", "title": "Remove async" },
|
23 |
| - { "time": "1:11:29", "title": "Corpora" } |
| 23 | + { "time": "1:11:29", "title": "Find a dataset on Corpora" }, |
| 24 | + { "time": "1:15:14", "title": "Get embeddings" }, |
| 25 | + { "time": "1:30:51", "title": "Embedding projector" }, |
| 26 | + { "time": "1:49:03", "title": "umap.js" }, |
| 27 | + { "time": "1:54:30", "title": "umap parameters" }, |
| 28 | + { "time": "2:00:51", "title": "Visualize umap results" }, |
| 29 | + { "time": "2:08:11", "title": "Step through one cycle of the algorithm" }, |
| 30 | + { "time": "2:14:56", "title": "Add raw embeddings json data" }, |
| 31 | + { "time": "2:17:47", "title": "Change circles to text" }, |
| 32 | + { "time": "2:24:46", "title": "Things you can try" }, |
| 33 | + { "time": "2:25:23", "title": "Outro" } |
24 | 34 | ],
|
25 | 35 | "codeExamples": [
|
26 | 36 | {
|
27 |
| - "title": "", |
28 |
| - "description": "", |
29 |
| - "image": "", |
30 |
| - "urls": { "p5": "" } |
| 37 | + "title": "Umap - P5 function name embeddings", |
| 38 | + "description": "Visualize the P5 function name embeddings", |
| 39 | + "image": "p5.jpg", |
| 40 | + "urls": { "p5": "https://editor.p5js.org/a2zitp/sketches/p63QTp0Sd" } |
31 | 41 | },
|
32 | 42 | {
|
33 |
| - "title": "Umap3 - Loading Embeddings", |
34 |
| - "description": "", |
35 |
| - "image": "", |
36 |
| - "urls": { "p5": "https://editor.p5js.org/codingtrain/sketches/AebzAbSpU" } |
| 43 | + "title": "Umap - random embeddings", |
| 44 | + "description": "Visualizing the umap with random data", |
| 45 | + "image": "umap1.jpg", |
| 46 | + "urls": { "p5": "https://editor.p5js.org/codingtrain/sketches/9CpF5OVy4" } |
37 | 47 | },
|
38 | 48 | {
|
39 |
| - "title": "Umap1 - Random Embeddings", |
40 |
| - "description": "", |
41 |
| - "image": "", |
42 |
| - "urls": { "p5": "https://editor.p5js.org/codingtrain/sketches/9CpF5OVy4" } |
| 49 | + "title": "Umap - tv show embeddings", |
| 50 | + "description": "Visualize the tv embeddings", |
| 51 | + "image": "umap3.jpg", |
| 52 | + "urls": { "p5": "https://editor.p5js.org/codingtrain/sketches/AebzAbSpU" } |
43 | 53 | },
|
44 | 54 | {
|
45 | 55 | "title": "Save Embeddings JSON",
|
|
59 | 69 | "description": "Course materials for Embeddings from Programming-from-A-to-Z"
|
60 | 70 | },
|
61 | 71 | {
|
62 |
| - "icon": "", |
| 72 | + "icon": "π", |
63 | 73 | "title": "Transformers.js",
|
64 | 74 | "url": "https://huggingface.co/docs/transformers.js/index",
|
65 | 75 | "description": "Reference for Transformers.js on Hugging Face"
|
66 | 76 | },
|
67 | 77 | {
|
68 |
| - "icon": "", |
| 78 | + "icon": "π", |
69 | 79 | "title": "umap-js Github Repo",
|
70 | 80 | "url": "https://github.com/PAIR-code/umap-js",
|
71 | 81 | "description": "umap-js Github repo"
|
72 | 82 | },
|
73 | 83 | {
|
74 |
| - "icon": "", |
| 84 | + "icon": "π", |
75 | 85 | "title": "Understanding UMAP",
|
76 | 86 | "url": "https://pair-code.github.io/understanding-umap",
|
77 | 87 | "description": "Article by Coenen and Pearce about UMAP."
|
78 | 88 | },
|
79 | 89 | {
|
80 |
| - "icon": "", |
| 90 | + "icon": "π", |
81 | 91 | "title": "RAG for Nature of Code",
|
82 | 92 | "url": "https://huggingface.co/spaces/lilacai/nature-of-code",
|
83 | 93 | "description": "Hugging Face space by lilacai for RAG-NOC"
|
84 | 94 | },
|
85 | 95 | {
|
86 |
| - "icon": "", |
| 96 | + "icon": "π", |
87 | 97 | "title": "C-Pack: Packaged Resources To Advance General Chinese Embedding",
|
88 | 98 | "url": "https://arxiv.org/pdf/2309.07597.pdf",
|
89 | 99 | "description": "Paper proposing C-Pack"
|
|
101 | 111 | "description": "Model card about bge-large-en-v1.5 on Hugging Face"
|
102 | 112 | },
|
103 | 113 | {
|
104 |
| - "icon": "", |
| 114 | + "icon": "π", |
105 | 115 | "title": "ml5",
|
106 | 116 | "url": "https://ml5js.org",
|
107 | 117 | "description": "Website with information and resources about the ml5 library."
|
108 | 118 | },
|
109 | 119 | {
|
110 |
| - "icon": "", |
| 120 | + "icon": "π", |
111 | 121 | "title": "tensorflow.js",
|
112 | 122 | "url": "https://www.tensorflow.org/js",
|
113 | 123 | "description": "Website with information and resources about the tensorflow.js library."
|
114 | 124 | },
|
115 | 125 | {
|
116 |
| - "icon": "", |
| 126 | + "icon": "π", |
117 | 127 | "title": "ONNX Runtime",
|
118 | 128 | "url": "https://onnxruntime.ai/docs/tutorials/web/",
|
119 | 129 | "description": "Tutorial that explains how to run a machine learning model in the browser using ONNX."
|
120 | 130 | },
|
121 | 131 | {
|
122 |
| - "icon": "", |
| 132 | + "icon": "π", |
123 | 133 | "title": "Corpora",
|
124 | 134 | "url": "https://github.com/dariusk/corpora",
|
125 | 135 | "description": "Corpora is a repository of JSON files."
|
126 | 136 | },
|
127 | 137 | {
|
128 |
| - "icon": "", |
| 138 | + "icon": "π", |
129 | 139 | "title": "tv_shows.json",
|
130 | 140 | "url": "https://github.com/dariusk/corpora/blob/master/data/film-tv/tv_shows.json",
|
131 | 141 | "description": "JSON file with a list of 1000 tv shows"
|
| 142 | + }, |
| 143 | + { |
| 144 | + "icon": "π", |
| 145 | + "title": "TV show embeddings", |
| 146 | + "url": "https://raw.githubusercontent.com/CodingTrain/Embeddings-Live/main/tv-embeddings.json", |
| 147 | + "description": "tv show embeddings" |
| 148 | + }, |
| 149 | + { |
| 150 | + "icon": "π", |
| 151 | + "title": "Embedding projector", |
| 152 | + "url": "https://projector.tensorflow.org", |
| 153 | + "description": "Website to visualize text embeddings" |
132 | 154 | }
|
133 | 155 | ]
|
134 | 156 | },
|
|
140 | 162 | "title": "How to Set up A Node Project",
|
141 | 163 | "url": "content/videos/discord/setup-node-project",
|
142 | 164 | "description": "My tutorial about setting up a Node project."
|
| 165 | + }, |
| 166 | + { |
| 167 | + "icon": "π", |
| 168 | + "title": "Introduction to Regular Expressions", |
| 169 | + "url": "https://www.youtube.com/watch?v=7DG3kCDx53c", |
| 170 | + "description": "My video about Regular Expressions." |
| 171 | + }, |
| 172 | + { |
| 173 | + "icon": "π", |
| 174 | + "title": "Exploring Transformers.js Embeddings and Other Updates", |
| 175 | + "url": "https://www.youtube.com/watch?v=RmFqv7Ehi1I", |
| 176 | + "description": "Livestream exploring Transformers.js" |
143 | 177 | }
|
144 | 178 | ]
|
145 | 179 | }
|
|
0 commit comments