Skip to content

Commit

Permalink
Merge pull request #419 from georgetown-cset/359-update-incompleteness
Browse files Browse the repository at this point in the history
Update incompleteness interval
  • Loading branch information
brianlove authored Jun 13, 2024
2 parents 231b272 + 82fbdd2 commit d0c1749
Show file tree
Hide file tree
Showing 6 changed files with 20 additions and 18 deletions.
2 changes: 1 addition & 1 deletion web/gui-v2/src/static_data/data.js

Large diffs are not rendered by default.

2 changes: 1 addition & 1 deletion web/gui-v2/src/static_data/overall_data.json
Original file line number Diff line number Diff line change
@@ -1 +1 @@
{"years": [2013, 2014, 2015, 2016, 2017, 2018, 2019, 2020, 2021, 2022, 2023], "startArticleYear": 2019, "endArticleYear": 2022, "startPatentYear": 2017, "endPatentYear": 2020, "groups": {"sp500": {"cset_id": 1000500, "name": "S&P 500", "articles": {"all_publications": {"total": 944, "counts": [78, 78, 81, 83, 85, 87, 92, 96, 94, 87, 82]}, "ai_publications": {"total": 104, "counts": [4, 4, 5, 6, 7, 10, 13, 16, 16, 12, 11]}, "ai_publications_growth": {"total": 3, "counts": []}, "highly_cited_ai_pubs": {"total": 23, "counts": [1, 1, 1, 2, 2, 3, 3, 4, 3, 2, 1]}, "ai_pubs_top_conf": {"total": 33, "counts": [1, 1, 2, 2, 2, 3, 5, 5, 6, 4, 3]}, "ai_citation_counts": {"total": 5733, "counts": [50, 74, 105, 150, 224, 364, 549, 768, 1002, 1099, 1347]}, "cv_citation_counts": {"total": 2862, "counts": [21, 31, 45, 65, 104, 179, 279, 380, 502, 561, 696]}, "nlp_citation_counts": {"total": 1269, "counts": [10, 16, 25, 39, 55, 86, 122, 167, 212, 234, 304]}, "robotics_citation_counts": {"total": 257, "counts": [4, 5, 7, 8, 12, 17, 24, 32, 41, 47, 61]}, "cv_publications": {"total": 28, "counts": [1, 1, 1, 2, 2, 3, 3, 4, 4, 3, 3]}, "nlp_publications": {"total": 21, "counts": [1, 1, 1, 1, 1, 2, 3, 4, 4, 3, 2]}, "robotics_publications": {"total": 7, "counts": [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1]}, "ai_citations_per_article": {"total": 11, "counts": [1, 2, 3, 3, 4, 6, 7, 8, 12, 16, 19]}, "all_pubs_5yr": {"total": 457, "counts": []}, "ai_pubs_percent": {"total": 5, "counts": []}, "ai_pubs_last_full_year": {"total": 12, "counts": []}}, "patents": {"ai_patents": {"total": 94, "counts": [2, 3, 4, 6, 9, 12, 14, 16, 16, 13, 0]}, "ai_patents_growth": {"total": 20, "counts": []}, "ai_patents_grants": {"total": 55, "counts": []}, "all_patents": {"total": 1370, "counts": [144, 138, 138, 139, 137, 134, 135, 132, 133, 136, 4]}, "Physical_Sciences_and_Engineering": {"total": 2, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Life_Sciences": {"total": 7, "counts": [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0]}, "Security__eg_cybersecurity": {"total": 6, "counts": [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0]}, "Transportation": {"total": 8, "counts": [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0]}, "Industrial_and_Manufacturing": {"total": 2, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Education": {"total": 1, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Document_Mgt_and_Publishing": {"total": 0, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Military": {"total": 0, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Agricultural": {"total": 1, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Computing_in_Government": {"total": 0, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Personal_Devices_and_Computing": {"total": 52, "counts": [1, 1, 2, 3, 5, 8, 9, 9, 8, 5, 0]}, "Banking_and_Finance": {"total": 5, "counts": [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0]}, "Telecommunications": {"total": 22, "counts": [0, 1, 1, 1, 2, 3, 3, 4, 4, 3, 0]}, "Networks__eg_social_IOT_etc": {"total": 2, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Business": {"total": 13, "counts": [0, 0, 1, 1, 2, 2, 2, 2, 2, 1, 0]}, "Energy_Management": {"total": 1, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Entertainment": {"total": 1, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Nanotechnology": {"total": 0, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Semiconductors": {"total": 1, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Language_Processing": {"total": 2, "counts": [0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0]}, "Speech_Processing": {"total": 5, "counts": [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0]}, "Knowledge_Representation": {"total": 9, "counts": [0, 0, 0, 1, 1, 2, 1, 1, 1, 1, 0]}, "Planning_and_Scheduling": {"total": 8, "counts": [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0]}, "Control": {"total": 10, "counts": [0, 0, 0, 1, 1, 2, 2, 1, 1, 1, 0]}, "Distributed_AI": {"total": 1, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Robotics": {"total": 0, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Computer_Vision": {"total": 16, "counts": [0, 0, 1, 1, 2, 3, 2, 3, 2, 2, 0]}, "Analytics_and_Algorithms": {"total": 8, "counts": [0, 0, 0, 0, 1, 1, 1, 1, 2, 1, 0]}, "Measuring_and_Testing": {"total": 7, "counts": [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0]}, "all_patents_5yr": {"total": 678, "counts": []}, "ai_patents_percent": {"total": 6, "counts": []}}, "other_metrics": {"tt1_jobs": {"total": 3546, "counts": null}, "ai_jobs": {"total": 316, "counts": null}}}, "globalBigTech": {"cset_id": 1000502, "name": "Global Big Tech", "articles": {"all_publications": {"total": 9854, "counts": [639, 683, 698, 720, 769, 872, 1047, 1174, 1256, 1039, 958]}, "ai_publications": {"total": 3455, "counts": [94, 111, 125, 147, 194, 300, 453, 554, 613, 463, 401]}, "ai_publications_growth": {"total": 8, "counts": []}, "highly_cited_ai_pubs": {"total": 834, "counts": [26, 32, 39, 48, 66, 91, 125, 127, 141, 92, 47]}, "ai_pubs_top_conf": {"total": 1317, "counts": [36, 35, 51, 52, 77, 121, 184, 194, 256, 182, 129]}, "ai_citation_counts": {"total": 181424, "counts": [1311, 1956, 2840, 4204, 6428, 10801, 16844, 23981, 31990, 36000, 45068]}, "cv_citation_counts": {"total": 94781, "counts": [573, 843, 1246, 1870, 3106, 5476, 8793, 12323, 16793, 19292, 24466]}, "nlp_citation_counts": {"total": 41688, "counts": [293, 456, 728, 1180, 1682, 2703, 3941, 5504, 7077, 7935, 10190]}, "robotics_citation_counts": {"total": 5878, "counts": [62, 80, 102, 129, 192, 324, 530, 731, 976, 1150, 1601]}, "cv_publications": {"total": 1079, "counts": [27, 33, 38, 42, 57, 86, 131, 162, 198, 162, 144]}, "nlp_publications": {"total": 790, "counts": [22, 25, 29, 33, 41, 67, 110, 136, 147, 106, 74]}, "robotics_publications": {"total": 146, "counts": [3, 4, 4, 6, 7, 12, 19, 22, 26, 23, 20]}, "ai_citations_per_article": {"total": 45, "counts": [13, 14, 16, 20, 24, 28, 29, 35, 45, 92, 182]}, "all_pubs_5yr": {"total": 5388, "counts": []}, "ai_pubs_percent": {"total": 39, "counts": []}, "ai_pubs_last_full_year": {"total": 463, "counts": []}}, "patents": {"ai_patents": {"total": 3187, "counts": [40, 57, 84, 141, 232, 315, 417, 586, 604, 532, 180]}, "ai_patents_growth": {"total": 31, "counts": []}, "ai_patents_grants": {"total": 1674, "counts": []}, "all_patents": {"total": 23013, "counts": [1819, 1771, 1932, 2125, 2135, 2317, 2638, 2635, 2606, 2518, 518]}, "Physical_Sciences_and_Engineering": {"total": 12, "counts": [0, 0, 0, 1, 1, 2, 1, 2, 2, 2, 1]}, "Life_Sciences": {"total": 120, "counts": [2, 3, 4, 8, 13, 14, 20, 22, 18, 13, 4]}, "Security__eg_cybersecurity": {"total": 132, "counts": [2, 3, 3, 6, 13, 18, 21, 25, 23, 17, 3]}, "Transportation": {"total": 181, "counts": [2, 2, 5, 10, 17, 27, 29, 31, 22, 23, 12]}, "Industrial_and_Manufacturing": {"total": 50, "counts": [0, 1, 1, 3, 5, 4, 7, 9, 8, 7, 4]}, "Education": {"total": 21, "counts": [1, 1, 1, 1, 3, 3, 3, 3, 3, 2, 0]}, "Document_Mgt_and_Publishing": {"total": 0, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Military": {"total": 0, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Agricultural": {"total": 9, "counts": [0, 0, 0, 1, 1, 1, 1, 2, 1, 2, 0]}, "Computing_in_Government": {"total": 8, "counts": [0, 0, 0, 0, 0, 0, 1, 2, 2, 1, 0]}, "Personal_Devices_and_Computing": {"total": 1793, "counts": [20, 30, 45, 83, 141, 193, 258, 370, 354, 233, 65]}, "Banking_and_Finance": {"total": 55, "counts": [1, 1, 2, 3, 6, 8, 10, 9, 11, 4, 2]}, "Telecommunications": {"total": 530, "counts": [8, 15, 18, 29, 53, 68, 76, 101, 86, 65, 12]}, "Networks__eg_social_IOT_etc": {"total": 57, "counts": [2, 3, 4, 8, 11, 8, 4, 8, 5, 3, 0]}, "Business": {"total": 300, "counts": [7, 10, 13, 24, 36, 38, 40, 54, 44, 28, 7]}, "Energy_Management": {"total": 20, "counts": [1, 1, 0, 1, 2, 2, 2, 3, 4, 4, 1]}, "Entertainment": {"total": 41, "counts": [1, 0, 1, 1, 2, 3, 6, 9, 9, 7, 3]}, "Nanotechnology": {"total": 3, "counts": [0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0]}, "Semiconductors": {"total": 15, "counts": [0, 0, 1, 1, 2, 2, 1, 3, 3, 2, 0]}, "Language_Processing": {"total": 64, "counts": [3, 5, 10, 15, 22, 9, 0, 0, 0, 0, 0]}, "Speech_Processing": {"total": 224, "counts": [4, 4, 6, 11, 20, 25, 32, 45, 42, 29, 6]}, "Knowledge_Representation": {"total": 222, "counts": [8, 10, 11, 18, 34, 34, 31, 31, 25, 17, 3]}, "Planning_and_Scheduling": {"total": 178, "counts": [4, 5, 8, 15, 21, 22, 23, 33, 26, 17, 4]}, "Control": {"total": 157, "counts": [2, 3, 6, 12, 22, 30, 31, 24, 15, 10, 2]}, "Distributed_AI": {"total": 13, "counts": [0, 0, 0, 1, 2, 3, 2, 2, 1, 1, 0]}, "Robotics": {"total": 2, "counts": [0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0]}, "Computer_Vision": {"total": 543, "counts": [6, 8, 11, 25, 55, 73, 69, 101, 97, 78, 21]}, "Analytics_and_Algorithms": {"total": 141, "counts": [3, 3, 5, 8, 11, 17, 20, 26, 26, 20, 3]}, "Measuring_and_Testing": {"total": 118, "counts": [2, 2, 4, 7, 11, 17, 19, 24, 16, 13, 3]}, "all_patents_5yr": {"total": 11850, "counts": []}, "ai_patents_percent": {"total": 17, "counts": []}}, "other_metrics": {"tt1_jobs": {"total": 41012, "counts": null}, "ai_jobs": {"total": 2817, "counts": null}}}}, "groupIdOffset": 1000000}
{"years": [2013, 2014, 2015, 2016, 2017, 2018, 2019, 2020, 2021, 2022, 2023], "startArticleYear": 2018, "endArticleYear": 2021, "startPatentYear": 2017, "endPatentYear": 2020, "groups": {"sp500": {"cset_id": 1000500, "name": "S&P 500", "articles": {"all_publications": {"total": 944, "counts": [78, 78, 81, 83, 85, 87, 92, 96, 94, 87, 82]}, "ai_publications": {"total": 104, "counts": [4, 4, 5, 6, 7, 10, 13, 16, 16, 12, 11]}, "ai_publications_growth": {"total": 12, "counts": []}, "highly_cited_ai_pubs": {"total": 23, "counts": [1, 1, 1, 2, 2, 3, 3, 4, 3, 2, 1]}, "ai_pubs_top_conf": {"total": 33, "counts": [1, 1, 2, 2, 2, 3, 5, 5, 6, 4, 3]}, "ai_citation_counts": {"total": 5733, "counts": [50, 74, 105, 150, 224, 364, 549, 768, 1002, 1099, 1347]}, "cv_citation_counts": {"total": 2862, "counts": [21, 31, 45, 65, 104, 179, 279, 380, 502, 561, 696]}, "nlp_citation_counts": {"total": 1269, "counts": [10, 16, 25, 39, 55, 86, 122, 167, 212, 234, 304]}, "robotics_citation_counts": {"total": 257, "counts": [4, 5, 7, 8, 12, 17, 24, 32, 41, 47, 61]}, "cv_publications": {"total": 28, "counts": [1, 1, 1, 2, 2, 3, 3, 4, 4, 3, 3]}, "nlp_publications": {"total": 21, "counts": [1, 1, 1, 1, 1, 2, 3, 4, 4, 3, 2]}, "robotics_publications": {"total": 7, "counts": [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1]}, "ai_citations_per_article": {"total": 11, "counts": [1, 2, 3, 3, 4, 6, 7, 8, 12, 16, 19]}, "all_pubs_5yr": {"total": 455, "counts": []}, "ai_pubs_percent": {"total": 5, "counts": []}, "ai_pubs_last_full_year": {"total": 16, "counts": []}}, "patents": {"ai_patents": {"total": 94, "counts": [2, 3, 4, 6, 9, 12, 14, 16, 16, 13, 0]}, "ai_patents_growth": {"total": 20, "counts": []}, "ai_patents_grants": {"total": 55, "counts": []}, "all_patents": {"total": 1370, "counts": [144, 138, 138, 139, 137, 134, 135, 132, 133, 136, 4]}, "Physical_Sciences_and_Engineering": {"total": 2, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Life_Sciences": {"total": 7, "counts": [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0]}, "Security__eg_cybersecurity": {"total": 6, "counts": [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0]}, "Transportation": {"total": 8, "counts": [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0]}, "Industrial_and_Manufacturing": {"total": 2, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Education": {"total": 1, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Document_Mgt_and_Publishing": {"total": 0, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Military": {"total": 0, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Agricultural": {"total": 1, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Computing_in_Government": {"total": 0, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Personal_Devices_and_Computing": {"total": 52, "counts": [1, 1, 2, 3, 5, 8, 9, 9, 8, 5, 0]}, "Banking_and_Finance": {"total": 5, "counts": [0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0]}, "Telecommunications": {"total": 22, "counts": [0, 1, 1, 1, 2, 3, 3, 4, 4, 3, 0]}, "Networks__eg_social_IOT_etc": {"total": 2, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Business": {"total": 13, "counts": [0, 0, 1, 1, 2, 2, 2, 2, 2, 1, 0]}, "Energy_Management": {"total": 1, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Entertainment": {"total": 1, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Nanotechnology": {"total": 0, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Semiconductors": {"total": 1, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Language_Processing": {"total": 2, "counts": [0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0]}, "Speech_Processing": {"total": 5, "counts": [0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0]}, "Knowledge_Representation": {"total": 9, "counts": [0, 0, 0, 1, 1, 2, 1, 1, 1, 1, 0]}, "Planning_and_Scheduling": {"total": 8, "counts": [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0]}, "Control": {"total": 10, "counts": [0, 0, 0, 1, 1, 2, 2, 1, 1, 1, 0]}, "Distributed_AI": {"total": 1, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Robotics": {"total": 0, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Computer_Vision": {"total": 16, "counts": [0, 0, 1, 1, 2, 3, 2, 3, 2, 2, 0]}, "Analytics_and_Algorithms": {"total": 8, "counts": [0, 0, 0, 0, 1, 1, 1, 1, 2, 1, 0]}, "Measuring_and_Testing": {"total": 7, "counts": [0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0]}, "all_patents_5yr": {"total": 678, "counts": []}, "ai_patents_percent": {"total": 6, "counts": []}}, "other_metrics": {"tt1_jobs": {"total": 3546, "counts": null}, "ai_jobs": {"total": 316, "counts": null}}}, "globalBigTech": {"cset_id": 1000502, "name": "Global Big Tech", "articles": {"all_publications": {"total": 9854, "counts": [639, 683, 698, 720, 769, 872, 1047, 1174, 1256, 1039, 958]}, "ai_publications": {"total": 3455, "counts": [94, 111, 125, 147, 194, 300, 453, 554, 613, 463, 401]}, "ai_publications_growth": {"total": 37, "counts": []}, "highly_cited_ai_pubs": {"total": 834, "counts": [26, 32, 39, 48, 66, 91, 125, 127, 141, 92, 47]}, "ai_pubs_top_conf": {"total": 1317, "counts": [36, 35, 51, 52, 77, 121, 184, 194, 256, 182, 129]}, "ai_citation_counts": {"total": 181424, "counts": [1311, 1956, 2840, 4204, 6428, 10801, 16844, 23981, 31990, 36000, 45068]}, "cv_citation_counts": {"total": 94781, "counts": [573, 843, 1246, 1870, 3106, 5476, 8793, 12323, 16793, 19292, 24466]}, "nlp_citation_counts": {"total": 41688, "counts": [293, 456, 728, 1180, 1682, 2703, 3941, 5504, 7077, 7935, 10190]}, "robotics_citation_counts": {"total": 5878, "counts": [62, 80, 102, 129, 192, 324, 530, 731, 976, 1150, 1601]}, "cv_publications": {"total": 1079, "counts": [27, 33, 38, 42, 57, 86, 131, 162, 198, 162, 144]}, "nlp_publications": {"total": 790, "counts": [22, 25, 29, 33, 41, 67, 110, 136, 147, 106, 74]}, "robotics_publications": {"total": 146, "counts": [3, 4, 4, 6, 7, 12, 19, 22, 26, 23, 20]}, "ai_citations_per_article": {"total": 45, "counts": [13, 14, 16, 20, 24, 28, 29, 35, 45, 92, 182]}, "all_pubs_5yr": {"total": 5118, "counts": []}, "ai_pubs_percent": {"total": 39, "counts": []}, "ai_pubs_last_full_year": {"total": 613, "counts": []}}, "patents": {"ai_patents": {"total": 3187, "counts": [40, 57, 84, 141, 232, 315, 417, 586, 604, 532, 180]}, "ai_patents_growth": {"total": 31, "counts": []}, "ai_patents_grants": {"total": 1674, "counts": []}, "all_patents": {"total": 23013, "counts": [1819, 1771, 1932, 2125, 2135, 2317, 2638, 2635, 2606, 2518, 518]}, "Physical_Sciences_and_Engineering": {"total": 12, "counts": [0, 0, 0, 1, 1, 2, 1, 2, 2, 2, 1]}, "Life_Sciences": {"total": 120, "counts": [2, 3, 4, 8, 13, 14, 20, 22, 18, 13, 4]}, "Security__eg_cybersecurity": {"total": 132, "counts": [2, 3, 3, 6, 13, 18, 21, 25, 23, 17, 3]}, "Transportation": {"total": 181, "counts": [2, 2, 5, 10, 17, 27, 29, 31, 22, 23, 12]}, "Industrial_and_Manufacturing": {"total": 50, "counts": [0, 1, 1, 3, 5, 4, 7, 9, 8, 7, 4]}, "Education": {"total": 21, "counts": [1, 1, 1, 1, 3, 3, 3, 3, 3, 2, 0]}, "Document_Mgt_and_Publishing": {"total": 0, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Military": {"total": 0, "counts": [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]}, "Agricultural": {"total": 9, "counts": [0, 0, 0, 1, 1, 1, 1, 2, 1, 2, 0]}, "Computing_in_Government": {"total": 8, "counts": [0, 0, 0, 0, 0, 0, 1, 2, 2, 1, 0]}, "Personal_Devices_and_Computing": {"total": 1793, "counts": [20, 30, 45, 83, 141, 193, 258, 370, 354, 233, 65]}, "Banking_and_Finance": {"total": 55, "counts": [1, 1, 2, 3, 6, 8, 10, 9, 11, 4, 2]}, "Telecommunications": {"total": 530, "counts": [8, 15, 18, 29, 53, 68, 76, 101, 86, 65, 12]}, "Networks__eg_social_IOT_etc": {"total": 57, "counts": [2, 3, 4, 8, 11, 8, 4, 8, 5, 3, 0]}, "Business": {"total": 300, "counts": [7, 10, 13, 24, 36, 38, 40, 54, 44, 28, 7]}, "Energy_Management": {"total": 20, "counts": [1, 1, 0, 1, 2, 2, 2, 3, 4, 4, 1]}, "Entertainment": {"total": 41, "counts": [1, 0, 1, 1, 2, 3, 6, 9, 9, 7, 3]}, "Nanotechnology": {"total": 3, "counts": [0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0]}, "Semiconductors": {"total": 15, "counts": [0, 0, 1, 1, 2, 2, 1, 3, 3, 2, 0]}, "Language_Processing": {"total": 64, "counts": [3, 5, 10, 15, 22, 9, 0, 0, 0, 0, 0]}, "Speech_Processing": {"total": 224, "counts": [4, 4, 6, 11, 20, 25, 32, 45, 42, 29, 6]}, "Knowledge_Representation": {"total": 222, "counts": [8, 10, 11, 18, 34, 34, 31, 31, 25, 17, 3]}, "Planning_and_Scheduling": {"total": 178, "counts": [4, 5, 8, 15, 21, 22, 23, 33, 26, 17, 4]}, "Control": {"total": 157, "counts": [2, 3, 6, 12, 22, 30, 31, 24, 15, 10, 2]}, "Distributed_AI": {"total": 13, "counts": [0, 0, 0, 1, 2, 3, 2, 2, 1, 1, 0]}, "Robotics": {"total": 2, "counts": [0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0]}, "Computer_Vision": {"total": 543, "counts": [6, 8, 11, 25, 55, 73, 69, 101, 97, 78, 21]}, "Analytics_and_Algorithms": {"total": 141, "counts": [3, 3, 5, 8, 11, 17, 20, 26, 26, 20, 3]}, "Measuring_and_Testing": {"total": 118, "counts": [2, 2, 4, 7, 11, 17, 19, 24, 16, 13, 3]}, "all_patents_5yr": {"total": 11850, "counts": []}, "ai_patents_percent": {"total": 17, "counts": []}}, "other_metrics": {"tt1_jobs": {"total": 41012, "counts": null}, "ai_jobs": {"total": 2817, "counts": null}}}}, "groupIdOffset": 1000000}
22 changes: 12 additions & 10 deletions web/scripts/retrieve_data.py
Original file line number Diff line number Diff line change
Expand Up @@ -74,8 +74,11 @@

_curr_time = datetime.now()
CURRENT_YEAR = _curr_time.year if _curr_time.month > 6 else _curr_time.year - 1
END_ARTICLE_YEAR = CURRENT_YEAR - 1
END_PATENT_YEAR = CURRENT_YEAR - 3
ARTICLE_OFFSET = 2
PATENT_OFFSET = 3
GROWTH_INTERVAL = 3
END_ARTICLE_YEAR = CURRENT_YEAR - ARTICLE_OFFSET
END_PATENT_YEAR = CURRENT_YEAR - PATENT_OFFSET
YEARS = list(range(CURRENT_YEAR - 10, CURRENT_YEAR + 1))

# Used (along with a check that we never actually meet or exceed this number with legitimate CSET ids)
Expand Down Expand Up @@ -387,15 +390,14 @@ def get_growth(yearly_counts: list, is_patents: bool = False) -> float:
:param is_patents: true if counts are for patents, false otherwise
:return: None; mutates rows
"""
offset = 3 if is_patents else 1
interval = 3
interval_values = yearly_counts[-(interval+1+offset):-1*offset]
offset = PATENT_OFFSET if is_patents else ARTICLE_OFFSET
interval_values = yearly_counts[-(GROWTH_INTERVAL+1+offset):-1*offset]
num_zero_years = sum([value == 0 for value in interval_values[:-1]])
if num_zero_years == interval:
if num_zero_years == GROWTH_INTERVAL:
return None
total_percentage_changes = sum([100*(interval_values[i+1]-interval_values[i])/interval_values[i]
for i in range(interval) if interval_values[i] > 0])
return total_percentage_changes/(interval-num_zero_years)
for i in range(GROWTH_INTERVAL) if interval_values[i] > 0])
return total_percentage_changes/(GROWTH_INTERVAL-num_zero_years)


def clean_country(country: str) -> str:
Expand Down Expand Up @@ -951,9 +953,9 @@ def update_overall_data(group_data: dict) -> None:
average_group_data = get_average_group_data(group_data)
overall_data = {
"years": YEARS,
"startArticleYear": CURRENT_YEAR - 4,
"startArticleYear": CURRENT_YEAR - ARTICLE_OFFSET - GROWTH_INTERVAL,
"endArticleYear": END_ARTICLE_YEAR,
"startPatentYear": CURRENT_YEAR - 6,
"startPatentYear": CURRENT_YEAR - PATENT_OFFSET - GROWTH_INTERVAL,
"endPatentYear": END_PATENT_YEAR,
"groups": average_group_data,
"groupIdOffset": GROUP_OFFSET
Expand Down
Loading

0 comments on commit d0c1749

Please sign in to comment.