Spaces:

openfree
/

svg

Running

App Files Community

openfree committed 3 days ago

Commit

a19af11

verified ·

1 Parent(s): 6c2404b

Update app.py

Browse files

Files changed (1) hide show

app.py +17 -17

app.py CHANGED Viewed

@@ -3,12 +3,12 @@ from datasets import load_dataset
 from rapidfuzz import process, fuzz
 # ──────────────────────────────────────────────────────────
-# 1) 데이터셋 로드 (스트리밍) ─ 메모리에 메타만 저장
 # ──────────────────────────────────────────────────────────
 ds = load_dataset(
     "nyuuzyou/clker-svg",
     split="train",
-    streaming=True,  # .jsonl.zst → 자동 스트리밍 해제
 )
 records = []
 for ex in ds:
@@ -23,16 +23,16 @@ for ex in ds:
     )
 # ──────────────────────────────────────────────────────────
-# 2) 검색 함수
 # ──────────────────────────────────────────────────────────
 def search_svg(query: str, top_k: int):
     if not query.strip():
-        return "⚠️ 검색어를 입력하세요.", None
-    # choices: index(int) ➜ title+tags 한 줄 문자열
     choices = {i: f"{r['title']} {r['tags']}" for i, r in enumerate(records)}
-    # Rapidfuzz: (choice_text, score, key) 반환
     matched = process.extract(
         query,
         choices,
@@ -44,23 +44,23 @@ def search_svg(query: str, top_k: int):
     html_start = '<div class="gallery-grid">'
     html_end = '</div>'
-    for _, score, idx in matched:  # idx 가 실제 list 인덱스
         r = records[idx]
         svg_html = (
             '<div class="gallery-item">'
             f'<div class="svg-container">{r["svg"]}</div>'
             f'<div class="item-details">'
             f'<h3>{r["title"]}</h3>'
-            f'<div class="score">매칭 점수: {score}</div>'
             f'<div class="tags">{r["tags"]}</div>'
-            f'<a href="{r["url"]}" target="_blank" class="download-link">원본 다운로드</a>'
             f'</div>'
             '</div>'
         )
         html_snippets.append(svg_html)
     if not html_snippets:
-        return "검색 결과가 없습니다.", None
     return "", html_start + ''.join(html_snippets) + html_end
@@ -69,8 +69,8 @@ def search_svg(query: str, top_k: int):
 # ──────────────────────────────────────────────────────────
 TITLE = "🔍 Clker SVG"
 DESCRIPTION = """
-이 애플리케이션은 "nyuuzyou/clker-svg" 데이터셋을 사용하여 퍼블릭 도메인 SVG 클립아트를 빠르게 검색할 수 있습니다.
-퍼지 매칭을 통해 제목과 태그에서 유사한 항목을 찾아 시각적 갤러리로 표시합니다.
 """
 DISCORD_BADGE = """<p style="text-align:center; margin-top: -10px;"><a href="https://discord.gg/openfreeai" target="_blank"> <img src="https://img.shields.io/static/v1?label=Discord&message=Openfree%20AI&color=%230000ff&labelColor=%23800080&logo=discord&logoColor=white&style=for-the-badge" alt="badge"></a></p>"""
@@ -151,8 +151,8 @@ with gr.Blocks(title=TITLE, css=CSS) as demo:
     with gr.Row():
         with gr.Column(scale=4):
             query_box = gr.Textbox(
-                label="검색어",
-                placeholder="예: cat, tree, house, computer, flower...",
                 show_label=True
             )
         with gr.Column(scale=1):
@@ -161,11 +161,11 @@ with gr.Blocks(title=TITLE, css=CSS) as demo:
                 maximum=50,
                 value=12,
                 step=3,
-                label="결과 개수"
             )
     with gr.Row():
-        search_button = gr.Button("검색", variant="primary")
     warning_md = gr.Markdown()
     output_html = gr.HTML()
@@ -183,4 +183,4 @@ with gr.Blocks(title=TITLE, css=CSS) as demo:
     )
 if __name__ == "__main__":
-    demo.launch()

 from rapidfuzz import process, fuzz
 # ──────────────────────────────────────────────────────────
+# 1) Load dataset (streaming) ─ only metadata kept in memory
 # ──────────────────────────────────────────────────────────
 ds = load_dataset(
     "nyuuzyou/clker-svg",
     split="train",
+    streaming=True,          # .jsonl.zst → streamed automatically
 )
 records = []
 for ex in ds:
     )
 # ──────────────────────────────────────────────────────────
+# 2) Search function
 # ──────────────────────────────────────────────────────────
 def search_svg(query: str, top_k: int):
     if not query.strip():
+        return "⚠️ Please enter a search term.", None
+    # choices: index(int) ➜ single-line title+tags string
     choices = {i: f"{r['title']} {r['tags']}" for i, r in enumerate(records)}
+    # Rapidfuzz: returns (choice_text, score, key)
     matched = process.extract(
         query,
         choices,
     html_start = '<div class="gallery-grid">'
     html_end = '</div>'
+    for _, score, idx in matched:      # idx is actual list index
         r = records[idx]
         svg_html = (
             '<div class="gallery-item">'
             f'<div class="svg-container">{r["svg"]}</div>'
             f'<div class="item-details">'
             f'<h3>{r["title"]}</h3>'
+            f'<div class="score">Match score: {score}</div>'
             f'<div class="tags">{r["tags"]}</div>'
+            f'<a href="{r["url"]}" target="_blank" class="download-link">Download original</a>'
             f'</div>'
             '</div>'
         )
         html_snippets.append(svg_html)
     if not html_snippets:
+        return "No results found.", None
     return "", html_start + ''.join(html_snippets) + html_end
 # ──────────────────────────────────────────────────────────
 TITLE = "🔍 Clker SVG"
 DESCRIPTION = """
+This application lets you quickly search public-domain SVG clip art using the “nyuuzyou/clker-svg” dataset.
+It finds similar items in titles and tags through fuzzy matching and shows them in a visual gallery.
 """
 DISCORD_BADGE = """<p style="text-align:center; margin-top: -10px;"><a href="https://discord.gg/openfreeai" target="_blank"> <img src="https://img.shields.io/static/v1?label=Discord&message=Openfree%20AI&color=%230000ff&labelColor=%23800080&logo=discord&logoColor=white&style=for-the-badge" alt="badge"></a></p>"""
     with gr.Row():
         with gr.Column(scale=4):
             query_box = gr.Textbox(
+                label="Search term",
+                placeholder="e.g. cat, tree, house, computer, flower...",
                 show_label=True
             )
         with gr.Column(scale=1):
                 maximum=50,
                 value=12,
                 step=3,
+                label="Number of results"
             )
     with gr.Row():
+        search_button = gr.Button("Search", variant="primary")
     warning_md = gr.Markdown()
     output_html = gr.HTML()
     )
 if __name__ == "__main__":
+    demo.launch()