|
from pathlib import Path |
|
import gradio as gr |
|
import pii_anonymizer |
|
|
|
def upload_file(filepath): |
|
name = Path(filepath).name |
|
return [gr.UploadButton(visible=False), gr.DownloadButton(label=f"Download {name}", value=filepath, visible=True)] |
|
|
|
def scrub_file(filepath, progress=gr.Progress()): |
|
|
|
stripped_lines = [] |
|
pii_lines = [] |
|
|
|
|
|
with open(filepath, 'r', encoding='utf-8') as file: |
|
for line in file: |
|
stripped_lines.append(line.strip()) |
|
progress(0, desc="Starting...") |
|
for line in progress.tqdm(stripped_lines): |
|
pii_lines.append(pii_anonymizer.anonymize_text_including_proper_nouns_and_addresses(line)) |
|
|
|
|
|
with open(filepath, 'w', encoding='utf-8') as file: |
|
for line in pii_lines: |
|
file.write(line + '\n') |
|
|
|
|
|
name = Path(filepath).name |
|
|
|
|
|
return [gr.UploadButton(visible=False), gr.DownloadButton(label=f"Download {name}", value=filepath, visible=True)] |
|
|
|
|
|
def download_file(): |
|
return [gr.UploadButton(visible=True), gr.DownloadButton(visible=False)] |
|
|
|
with gr.Blocks() as demo: |
|
gr.Markdown("First upload a file and and then you'll be able download a PII stripped version of it (but only once!)") |
|
|
|
with gr.Row(): |
|
u = gr.UploadButton("Upload a file", file_count="single", file_types=["text"]) |
|
d = gr.DownloadButton("Download the file", visible=False) |
|
|
|
|
|
u.upload(scrub_file, u, [u, d]) |
|
d.click(download_file, None, [u, d]) |
|
|
|
|
|
if __name__ == "__main__": |
|
demo.queue().launch() |
|
|