m7n commited on
Commit
d37c745
·
1 Parent(s): 41c382c

Update datamapplot dependency and minor UI text adjustments

Browse files
Files changed (2) hide show
  1. app.py +5 -5
  2. requirements.txt +1 -1
app.py CHANGED
@@ -372,7 +372,7 @@ def predict(request: gr.Request, text_input, sample_size_slider, reduce_sample_c
372
 
373
  hover_text=[str(row['title']) for ix, row in stacked_df.iterrows()],
374
  marker_color_array=stacked_df['color'],
375
- use_medoids=False, # Switch back once efficient mediod caclulation comes out!
376
  width=1000,
377
  height=1000,
378
  point_radius_min_pixels=1,
@@ -401,7 +401,7 @@ def predict(request: gr.Request, text_input, sample_size_slider, reduce_sample_c
401
  print(f"Plot created and saved in {time.time() - plot_start:.2f} seconds")
402
 
403
 
404
-
405
  # Save additional files if requested
406
  csv_file_path = static_dir / f"{filename}.csv"
407
  png_file_path = static_dir / f"{filename}.png"
@@ -429,7 +429,7 @@ def predict(request: gr.Request, text_input, sample_size_slider, reduce_sample_c
429
 
430
  # Get the 30 most common labels
431
  unique_labels, counts = np.unique(combined_labels, return_counts=True)
432
- top_30_labels = set(unique_labels[np.argsort(counts)[-50:]])
433
 
434
  # Replace less common labels with 'Unlabelled'
435
  combined_labels = np.array(['Unlabelled' if label not in top_30_labels else label for label in combined_labels])
@@ -451,7 +451,7 @@ def predict(request: gr.Request, text_input, sample_size_slider, reduce_sample_c
451
  label_wrap_width=12,
452
  label_over_points=True,
453
  dynamic_label_size=True,
454
- use_medoids=False, # Switch back once efficient mediod caclulation comes out!
455
  point_size=2,
456
  marker_color_array=colors_base,
457
  force_matplotlib=True,
@@ -583,7 +583,7 @@ with gr.Blocks(theme=theme, css="""
583
 
584
  OpenAlex Mapper is a way of projecting search queries from the amazing OpenAlex database on a background map of randomly sampled papers from OpenAlex, which allows you to easily investigate interdisciplinary connections. OpenAlex Mapper was developed by [Maximilian Noichl](https://maxnoichl.eu) and [Andrea Loettgers](https://unige.academia.edu/AndreaLoettgers) at the [Possible Life project](http://www.possiblelife.eu/).
585
 
586
- To use OpenAlex Mapper, first head over to [OpenAlex](https://openalex.org/) and search for something that interests you. For example, you could search for all the papers that make use of the [Kuramoto model](https://openalex.org/works?page=1&filter=default.search%3A%22Kuramoto%20Model%22), for all the papers that were published by researchers at [Utrecht University in 2019](https://openalex.org/works?page=1&filter=authorships.institutions.lineage%3Ai193662353,publication_year%3A2019), or for all the papers that cite Wittgenstein's [Philosophical Investigations](https://openalex.org/works?page=1&filter=cites%3Aw4251395411). Then you copy the URL to that search query into the OpenAlex search URL box below and click "Run Query." It will download all of these records from OpenAlex and embed them on our interactive map. As the embedding step is a little expensive, computationally, it's often a good idea to play around with smaller samples, before running a larger analysis (see below for a note on sample size and run-time). After a little time, that map will appear and be available for you to interact with and download. You can find more explanations in the FAQs below.
587
  </div>
588
 
589
  """)
 
372
 
373
  hover_text=[str(row['title']) for ix, row in stacked_df.iterrows()],
374
  marker_color_array=stacked_df['color'],
375
+ use_medoids=True, # Switch back once efficient mediod caclulation comes out!
376
  width=1000,
377
  height=1000,
378
  point_radius_min_pixels=1,
 
401
  print(f"Plot created and saved in {time.time() - plot_start:.2f} seconds")
402
 
403
 
404
+ #datamapplot==0.5.1
405
  # Save additional files if requested
406
  csv_file_path = static_dir / f"{filename}.csv"
407
  png_file_path = static_dir / f"{filename}.png"
 
429
 
430
  # Get the 30 most common labels
431
  unique_labels, counts = np.unique(combined_labels, return_counts=True)
432
+ top_30_labels = set(unique_labels[np.argsort(counts)[-80:]])
433
 
434
  # Replace less common labels with 'Unlabelled'
435
  combined_labels = np.array(['Unlabelled' if label not in top_30_labels else label for label in combined_labels])
 
451
  label_wrap_width=12,
452
  label_over_points=True,
453
  dynamic_label_size=True,
454
+ use_medoids=True, # Switch back once efficient mediod caclulation comes out!
455
  point_size=2,
456
  marker_color_array=colors_base,
457
  force_matplotlib=True,
 
583
 
584
  OpenAlex Mapper is a way of projecting search queries from the amazing OpenAlex database on a background map of randomly sampled papers from OpenAlex, which allows you to easily investigate interdisciplinary connections. OpenAlex Mapper was developed by [Maximilian Noichl](https://maxnoichl.eu) and [Andrea Loettgers](https://unige.academia.edu/AndreaLoettgers) at the [Possible Life project](http://www.possiblelife.eu/).
585
 
586
+ To use OpenAlex Mapper, first head over to [OpenAlex](https://openalex.org/) and search for something that interests you. For example, you could search for all the papers that make use of the [Kuramoto model](https://openalex.org/works?page=1&filter=default.search%3A%22Kuramoto%20Model%22), for all the papers that were published by researchers at [Utrecht University in 2019](https://openalex.org/works?page=1&filter=authorships.institutions.lineage%3Ai193662353,publication_year%3A2019), or for all the papers that cite Wittgenstein's [Philosophical Investigations](https://openalex.org/works?page=1&filter=cites%3Aw4251395411). Then you copy the URL to that search query into the OpenAlex search URL box below and click "Run Query." It will download all of these records from OpenAlex and embed them on our interactive map. As the embedding step is a little expensive, computationally, it's often a good idea to play around with smaller samples, before running a larger analysis (see below for a note on sample size and gpu-limits). After a little time, that map will appear and be available for you to interact with and download. You can find more explanations in the FAQs below.
587
  </div>
588
 
589
  """)
requirements.txt CHANGED
@@ -10,7 +10,7 @@ adapters
10
  torch
11
  tqdm
12
  pyarrow
13
- datamapplot==0.5.1
14
  numba==0.58.1
15
  umap-learn==0.5.7
16
  pynndescent==0.5.12
 
10
  torch
11
  tqdm
12
  pyarrow
13
+ git+https://github.com/TutteInstitute/datamapplot.git
14
  numba==0.58.1
15
  umap-learn==0.5.7
16
  pynndescent==0.5.12