znation HF Staff committed on
Commit
d933385
·
1 Parent(s): 7c5aaae
Files changed (1) hide show
  1. index.html +34 -34
index.html CHANGED
@@ -12,41 +12,41 @@
12
  <body>
13
  <div class="card">
14
  <h1>Visualizing Repo-level Dedupe</h1>
15
- <p>This visualization demonstrates the amount of [chunk-level dedupe](https://huggingface.co/blog/from-files-to-chunks) within a repo or across a selection of repos. (For now, demonstrates a hardcoded selection.)</p>
16
- <div id="vis"></div>
17
- <script>
18
- var vlSpec = {
19
- "$schema": "https://vega.github.io/schema/vega-lite/v5.json",
20
- "resolve": {"scale": {"x": "independent"}},
21
- "width": 600,
22
- "height": 12,
23
- "data": {
24
- "url": "xorbs.json"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
  },
26
- "mark": "rect",
27
- "encoding": {
28
- "x": {
29
- "field": "xorb_id",
30
- "axis": null,
31
- "sort": {"field": "dedupe_factor", "order": "descending"},
32
- "stack": "normalize"
33
- },
34
- "color": {
35
- "field": "dedupe_factor",
36
- "type": "quantitative",
37
- "scale": {"domain": [0, 10]}
38
- },
39
- "tooltip": {"field": "dedupe_factor"},
40
- "row": {
41
- "field": "repo",
42
- "spacing": 1,
43
- "header": {"labelAngle": 0, "labelAlign": "left"},
44
- "sort": {"field": "dedupe_factor", "order": "descending"}
45
- }
46
  }
47
- };
48
- vegaEmbed('#vis', vlSpec);
49
- </script>
50
- </div>
51
  </body>
52
  </html>
 
12
  <body>
13
  <div class="card">
14
  <h1>Visualizing Repo-level Dedupe</h1>
15
+ <p>This visualization demonstrates the amount of <a href="https://huggingface.co/blog/from-files-to-chunks">chunk-level dedupe</a> within a repo or across a selection of repos. (For now, demonstrates a hardcoded selection.)</p>
16
+ </div>
17
+ <div id="vis"></div>
18
+ <script>
19
+ var vlSpec = {
20
+ "$schema": "https://vega.github.io/schema/vega-lite/v5.json",
21
+ "resolve": {"scale": {"x": "independent"}},
22
+ "width": 600,
23
+ "height": 12,
24
+ "data": {
25
+ "url": "xorbs.json"
26
+ },
27
+ "mark": "rect",
28
+ "encoding": {
29
+ "x": {
30
+ "field": "xorb_id",
31
+ "axis": null,
32
+ "sort": {"field": "dedupe_factor", "order": "descending"},
33
+ "stack": "normalize"
34
+ },
35
+ "color": {
36
+ "field": "dedupe_factor",
37
+ "type": "quantitative",
38
+ "scale": {"domain": [0, 10]}
39
  },
40
+ "tooltip": {"field": "dedupe_factor"},
41
+ "row": {
42
+ "field": "repo",
43
+ "spacing": 1,
44
+ "header": {"labelAngle": 0, "labelAlign": "left"},
45
+ "sort": {"field": "dedupe_factor", "order": "descending"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
46
  }
47
+ }
48
+ };
49
+ vegaEmbed('#vis', vlSpec);
50
+ </script>
51
  </body>
52
  </html>