File size: 12,705 Bytes
68eb6f0
 
 
 
a9c10db
68eb6f0
 
 
5cf84fa
 
68eb6f0
 
 
 
5cf84fa
68eb6f0
5cf84fa
68eb6f0
0a426ed
68eb6f0
 
b53c1d8
 
cb05cc3
68eb6f0
a9c10db
68eb6f0
 
12b1fe6
 
 
68eb6f0
 
 
 
 
 
 
 
 
 
12b1fe6
 
 
 
 
68eb6f0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12b1fe6
 
 
 
 
 
68eb6f0
5cf84fa
68eb6f0
 
 
 
 
 
 
 
 
 
0a426ed
 
 
 
 
 
 
 
 
 
 
 
 
 
68eb6f0
 
 
 
 
b53c1d8
68eb6f0
cb05cc3
68eb6f0
 
 
 
 
 
 
 
 
 
 
 
a9c10db
68eb6f0
 
 
12b1fe6
68eb6f0
 
 
12b1fe6
68eb6f0
 
 
 
 
 
 
 
12b1fe6
 
68eb6f0
a9c10db
 
 
68eb6f0
a9c10db
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
import spaces
import gradio as gr
from hfsearch import (HFSearchResult, search, update_filter, update_df, get_labels, get_valid_labels,
                      get_tags, get_subtag_categories, update_subtag_items, update_tags, update_subtags,
                      search_ref_repos, search_cols, DS_SIZE_CATEGORIES, SPACE_HARDWARES, SPACE_STAGES, TYPES_DESC)
from gradio_huggingfacehub_search import HuggingfaceHubSearch

CSS = """

#container { margin: 0 auto; !important; }

#col-container { margin: 0 auto; !important; }

.title { align-items: center; text-align: center; }

.info { align-items: center; text-align: center; }

"""

with gr.Blocks(theme="NoCrypt/miku", elem_id="container", fill_width=True, css=CSS) as demo:
    gr.Markdown("# Search Hugging Face🤗", elem_classes="title")
    with gr.Column(elem_id="col-container"):
        search_result = gr.State(value=HFSearchResult())
        with gr.Tab("Search"):
            with gr.Group():
                with gr.Row(equal_height=True):
                    repo_types = gr.CheckboxGroup(label="Repo type", choices=["model", "dataset", "space", "collection"], value=["model", "dataset", "space"])
                    filter_str = gr.Textbox(label="Filter", info="String(s) to filter repos", value="")
                    sort = gr.Dropdown(label="Sort", choices=["last_modified", "likes", "downloads", "trending_score"], value="likes")
                with gr.Accordion("Advanced", open=False):
                    ui_mode = gr.Radio(label="Mode", choices=["PC", "Phone"], value="Phone")
                    with gr.Row(equal_height=True):
                        search_str = gr.Textbox(label="Search", info="A string that will be contained in the returned repo ids", placeholder="bert", value="", lines=1)
                        #author = gr.Textbox(label="Author", info="The author (user or organization)", value="", lines=1)
                        author = HuggingfaceHubSearch(label="Author", placeholder="The author (user or organization)", search_type="user", sumbit_on_select=False)
                        followed = HuggingfaceHubSearch(label="Followed by", placeholder="Extract repos followed by this user", search_type="user", sumbit_on_select=False)
                    with gr.Column():
                        tags = gr.Textbox(label="Tags", info="Tag(s) to filter repos", value="")
                        with gr.Accordion("Tag input assistance", open=False):
                            with gr.Row(equal_height=True):
                                tag_item = gr.Dropdown(label="Item", choices=get_tags(), value=get_tags()[0], allow_custom_value=True, scale=4)
                                tag_btn = gr.Button("Add", scale=1)
                            with gr.Row(equal_height=True):
                                subtag_cat = gr.Dropdown(label="Category", choices=get_subtag_categories(), value=get_subtag_categories()[0], scale=2)
                                subtag_item = gr.Dropdown(label="Item", choices=[""], value="", allow_custom_value=True, scale=2)
                                subtug_btn = gr.Button("Add", scale=1)
                    with gr.Row(equal_height=True):
                        with gr.Column():
                            gated_status = gr.Radio(label="Gated status", choices=["gated", "non-gated", "all"], value="all")
                            appr_status = gr.CheckboxGroup(label="Approval method", choices=["auto", "manual"], value=["auto", "manual"])
                        limit = gr.Number(label="Limit", info="If 0, fetches all models", value=1000, step=1, minimum=0, maximum=10000000)
                    with gr.Tab("for Models"):
                        with gr.Column():
                            infer_status = gr.Radio(label="Inference status", choices=["warm", "cold", "frozen", "all"], value="all")
                            gr.Markdown("[About the Inference API status (Warm, Cold, Frozen)](https://huggingface.co./docs/api-inference/supported-models)", elem_classes="info")
                    #    with gr.Row(equal_height=True):
                    #        model_task = gr.Textbox(label="Task", info="String(s) of tasks models were designed for", placeholder="fill-mask", value="")
                    #        trained_dataset = gr.Textbox(label="Trained dataset", info="Trained dataset for a model", value="")
                    with gr.Tab("for Datasets"):
                        size_categories = gr.CheckboxGroup(label="Size categories", info="The size of the dataset", choices=DS_SIZE_CATEGORIES, value=[])
                    #    task_categories = gr.Textbox(label="Task categories", info="Identify datasets by the designed task", value="")
                    #    task_ids = gr.Textbox(label="Task IDs", info="Identify datasets by the specific task", value="")
                    #    language_creators = gr.Textbox(label="Language creators", info="Identify datasets with how the data was curated", value="")
                    #    language = gr.Textbox(label="Language", info="String(s) representing two-character language to filter datasets by", value="")
                    #    multilinguality = gr.Textbox(label="Multilinguality", info="String(s) representing a filter for datasets that contain multiple languages", value="")
                    with gr.Tab("for Spaces"):
                        with gr.Row(equal_height=True):
                            hardware = gr.CheckboxGroup(label="Specify hardware", choices=SPACE_HARDWARES, value=[])
                            stage = gr.CheckboxGroup(label="Specify stage", choices=SPACE_STAGES, value=[])
                    with gr.Accordion("More Advanced", open=False):
                        with gr.Row(equal_height=True):
                            sort_method = gr.Radio(label="Sort method", choices=["ascending order", "descending order"], value="ascending order")
                            fetch_detail = gr.CheckboxGroup(label="Fetch detail", choices=["Space Runtime"], value=["Space Runtime"])
                        with gr.Row(equal_height=True):
                            show_labels = gr.CheckboxGroup(label="Show items", choices=get_labels(), value=get_valid_labels())
                run_button = gr.Button("Search", variant="primary")
        with gr.Tab("Inference API"):
            with gr.Group():
                with gr.Row(equal_height=True):
                    infer_repo_types = gr.CheckboxGroup(label="Repo type", choices=["model", "dataset", "space"], value=["model"], visible=False)
                    with gr.Column():
                        infer_infer_status = gr.Radio(label="Inference status", choices=["warm", "cold", "frozen", "all"], value="warm")
                        gr.Markdown("[About the Inference API status (Warm, Cold, Frozen)](https://huggingface.co./docs/api-inference/supported-models)", elem_classes="info")
                    with gr.Column():
                        infer_gated_status = gr.Radio(label="Gated status", choices=["gated", "non-gated", "all"], value="all")
                        infer_appr_status = gr.CheckboxGroup(label="Approval method", choices=["auto", "manual"], value=["auto", "manual"])
                infer_run_button = gr.Button("Search", variant="primary")
        with gr.Tab("Collections"):
            with gr.Group():
                with gr.Row(equal_height=True):
                    #rec_repo_id = gr.Textbox(label="Repo ID", info="Input your favorite repo", value="")
                    col_repo_id = HuggingfaceHubSearch(label="Repo ID or User ID", placeholder="Input your favorite Repo ID or User ID", search_type=["model", "dataset", "space", "user"],
                                                       sumbit_on_select=False)
                    col_sort = gr.Dropdown(label="Sort", choices=["last_modified", "trending_score", "likes"], value="likes")
                with gr.Row(equal_height=True):
                    col_repo_limit = gr.Number(label="Limit for repos", value=50, step=1, minimum=1, maximum=100)
                    col_user_limit = gr.Number(label="Limit for users", value=10, step=1, minimum=0, maximum=50)
                with gr.Accordion("Advanced", open=False):
                    col_show_labels = gr.CheckboxGroup(label="Show items", choices=get_labels(), value=get_valid_labels())
            col_run_button = gr.Button("Search", variant="primary")
        with gr.Tab("Recommended repos"):
            with gr.Group():
                with gr.Row(equal_height=True):
                    #rec_repo_id = gr.Textbox(label="Repo ID", info="Input your favorite repo", value="")
                    rec_repo_id = HuggingfaceHubSearch(label="Repo ID", placeholder="Input your favorite Repo ID", search_type=["model", "dataset", "space"],
                                                       sumbit_on_select=False)
                    rec_repo_types = gr.CheckboxGroup(label="Repo type", choices=["model", "dataset", "space", "collection"], value=["model", "dataset", "space", "collection"])
                with gr.Row(equal_height=True):
                    rec_sort = gr.Dropdown(label="Sort", choices=["last_modified", "likes", "downloads", "downloads_all_time", "trending_score"], value="likes")
                    rec_limit = gr.Number(label="Limit", value=20, step=1, minimum=1, maximum=1000)
                with gr.Accordion("Advanced", open=False):
                    with gr.Row(equal_height=True):
                        rec_show_labels = gr.CheckboxGroup(label="Show items", choices=get_labels(), value=get_valid_labels())
            rec_run_button = gr.Button("Search", variant="primary")
        with gr.Group():
            with gr.Accordion("Filter", open=False):
                hide_labels = gr.CheckboxGroup(label="Hide items", choices=[], value=[], visible=False)
                with gr.Row(equal_height=True):
                    filter_item1 = gr.Dropdown(label="Filter item", choices=[""], value="", visible=False)
                    filter1 = gr.Dropdown(label="Filter", choices=[""], value="", allow_custom_value=True, visible=False)
                    filter_btn = gr.Button("Apply filter", variant="secondary", visible=False)
            types_desc = gr.Markdown(TYPES_DESC, elem_classes="info")
            result_df = gr.DataFrame(label="Results", type="pandas", value=None, interactive=False)

    run_button.click(search, [repo_types, sort, sort_method, filter_str, search_str, author, tags, infer_status, gated_status, appr_status,
                              size_categories, limit, hardware, stage, followed, fetch_detail, show_labels, ui_mode, search_result],
                     [result_df, hide_labels, search_result])\
    .success(update_filter, [filter_item1, search_result], [filter_item1, filter1, filter_btn, search_result], queue=False)
    infer_run_button.click(search, [infer_repo_types, sort, sort_method, filter_str, search_str, author, tags, infer_infer_status, infer_gated_status, infer_appr_status,
                                    size_categories, limit, hardware, stage, followed, fetch_detail, show_labels, ui_mode, search_result],
                           [result_df, hide_labels, search_result])\
    .success(update_filter, [filter_item1, search_result], [filter_item1, filter1, filter_btn, search_result], queue=False)
    gr.on(triggers=[hide_labels.change, filter_btn.click], fn=update_df, inputs=[hide_labels, filter_item1, filter1, search_result],
          outputs=[result_df, search_result], trigger_mode="once", queue=False, show_api=False)
    filter_item1.change(update_filter, [filter_item1, search_result], [filter_item1, filter1, filter_btn, search_result], queue=False, show_api=False)
    subtag_cat.change(update_subtag_items, [subtag_cat], [subtag_item], queue=False, show_api=False)
    subtug_btn.click(update_subtags, [tags, subtag_cat, subtag_item], [tags], queue=False, show_api=False)
    tag_btn.click(update_tags, [tags, tag_item], [tags], queue=False, show_api=False)
    gr.on(triggers=[rec_run_button.click, rec_repo_id.submit], fn=search_ref_repos,
          inputs=[rec_repo_id, rec_repo_types, rec_sort, rec_show_labels, rec_limit, ui_mode, search_result],
          outputs=[result_df, hide_labels, search_result])
    gr.on(triggers=[col_run_button.click, col_repo_id.submit], fn=search_cols,
          inputs=[col_repo_id, col_sort, col_show_labels, col_repo_limit, col_user_limit, ui_mode, search_result],
          outputs=[result_df, hide_labels, search_result])

demo.queue().launch(ssr_mode=False)