Spaces:
Running
Running
fixes
Browse files- index.html +34 -34
index.html
CHANGED
@@ -12,41 +12,41 @@
|
|
12 |
<body>
|
13 |
<div class="card">
|
14 |
<h1>Visualizing Repo-level Dedupe</h1>
|
15 |
-
|
16 |
-
|
17 |
-
|
18 |
-
|
19 |
-
|
20 |
-
|
21 |
-
|
22 |
-
|
23 |
-
|
24 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
25 |
},
|
26 |
-
"
|
27 |
-
"
|
28 |
-
"
|
29 |
-
|
30 |
-
|
31 |
-
|
32 |
-
"stack": "normalize"
|
33 |
-
},
|
34 |
-
"color": {
|
35 |
-
"field": "dedupe_factor",
|
36 |
-
"type": "quantitative",
|
37 |
-
"scale": {"domain": [0, 10]}
|
38 |
-
},
|
39 |
-
"tooltip": {"field": "dedupe_factor"},
|
40 |
-
"row": {
|
41 |
-
"field": "repo",
|
42 |
-
"spacing": 1,
|
43 |
-
"header": {"labelAngle": 0, "labelAlign": "left"},
|
44 |
-
"sort": {"field": "dedupe_factor", "order": "descending"}
|
45 |
-
}
|
46 |
}
|
47 |
-
}
|
48 |
-
|
49 |
-
|
50 |
-
|
51 |
</body>
|
52 |
</html>
|
|
|
12 |
<body>
|
13 |
<div class="card">
|
14 |
<h1>Visualizing Repo-level Dedupe</h1>
|
15 |
+
<p>This visualization demonstrates the amount of <a href="https://huggingface.co/blog/from-files-to-chunks">chunk-level dedupe</a> within a repo or across a selection of repos. (For now, demonstrates a hardcoded selection.)</p>
|
16 |
+
</div>
|
17 |
+
<div id="vis"></div>
|
18 |
+
<script>
|
19 |
+
var vlSpec = {
|
20 |
+
"$schema": "https://vega.github.io/schema/vega-lite/v5.json",
|
21 |
+
"resolve": {"scale": {"x": "independent"}},
|
22 |
+
"width": 600,
|
23 |
+
"height": 12,
|
24 |
+
"data": {
|
25 |
+
"url": "xorbs.json"
|
26 |
+
},
|
27 |
+
"mark": "rect",
|
28 |
+
"encoding": {
|
29 |
+
"x": {
|
30 |
+
"field": "xorb_id",
|
31 |
+
"axis": null,
|
32 |
+
"sort": {"field": "dedupe_factor", "order": "descending"},
|
33 |
+
"stack": "normalize"
|
34 |
+
},
|
35 |
+
"color": {
|
36 |
+
"field": "dedupe_factor",
|
37 |
+
"type": "quantitative",
|
38 |
+
"scale": {"domain": [0, 10]}
|
39 |
},
|
40 |
+
"tooltip": {"field": "dedupe_factor"},
|
41 |
+
"row": {
|
42 |
+
"field": "repo",
|
43 |
+
"spacing": 1,
|
44 |
+
"header": {"labelAngle": 0, "labelAlign": "left"},
|
45 |
+
"sort": {"field": "dedupe_factor", "order": "descending"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
46 |
}
|
47 |
+
}
|
48 |
+
};
|
49 |
+
vegaEmbed('#vis', vlSpec);
|
50 |
+
</script>
|
51 |
</body>
|
52 |
</html>
|