Skip to content

Commit fac97d5

Browse files
author
Steve Baskauf
committed
Fixed bug #15
1 parent e4b1ae5 commit fac97d5

6 files changed

Lines changed: 2303 additions & 111 deletions

File tree

publications/data/automate_collect_data.ipynb

Lines changed: 87 additions & 109 deletions
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@
22
"cells": [
33
{
44
"cell_type": "code",
5-
"execution_count": 3,
5+
"execution_count": 1,
66
"metadata": {},
77
"outputs": [],
88
"source": [
@@ -236,6 +236,7 @@
236236
"\n",
237237
"def get_file_sha(account, repo, file_path):\n",
238238
" # get the data about the file to get its blob SHA\n",
239+
"\n",
239240
" r = requests.get('https://api.github.com/repos/' + account + '/' + repo + '/contents/' + file_path)\n",
240241
" file_data = r.json()\n",
241242
" try:\n",
@@ -502,65 +503,9 @@
502503
"name": "stdout",
503504
"output_type": "stream",
504505
"text": [
505-
"Time checked: 2020-08-27T10:33:18.706690\n",
506-
"Date last run: 2020-08-27\n",
507-
"UTC date now is: 2020-08-27\n",
508-
"\n",
509-
"Time checked: 2020-08-27T11:33:19.173854\n",
510-
"Date last run: 2020-08-27\n",
511-
"UTC date now is: 2020-08-27\n",
512-
"\n",
513-
"Time checked: 2020-08-27T12:33:19.920486\n",
514-
"Date last run: 2020-08-27\n",
515-
"UTC date now is: 2020-08-27\n",
516-
"\n",
517-
"Time checked: 2020-08-27T13:33:20.599188\n",
518-
"Date last run: 2020-08-27\n",
519-
"UTC date now is: 2020-08-27\n",
520-
"\n",
521-
"Time checked: 2020-08-27T14:33:21.165710\n",
522-
"Date last run: 2020-08-27\n",
523-
"UTC date now is: 2020-08-27\n",
524-
"\n",
525-
"Time checked: 2020-08-27T15:33:21.793703\n",
526-
"Date last run: 2020-08-27\n",
527-
"UTC date now is: 2020-08-27\n",
528-
"\n",
529-
"Time checked: 2020-08-27T16:33:22.378751\n",
530-
"Date last run: 2020-08-27\n",
531-
"UTC date now is: 2020-08-27\n",
532-
"\n",
533-
"Time checked: 2020-08-27T17:33:23.047082\n",
534-
"Date last run: 2020-08-27\n",
535-
"UTC date now is: 2020-08-27\n",
536-
"\n",
537-
"Time checked: 2020-08-27T18:33:23.696642\n",
538-
"Date last run: 2020-08-27\n",
539-
"UTC date now is: 2020-08-27\n",
540-
"\n",
541-
"Time checked: 2020-08-27T19:33:24.308007\n",
542-
"Date last run: 2020-08-27\n",
543-
"UTC date now is: 2020-08-27\n",
544-
"\n",
545-
"Time checked: 2020-08-27T20:33:24.927389\n",
546-
"Date last run: 2020-08-27\n",
547-
"UTC date now is: 2020-08-27\n",
548-
"\n",
549-
"Time checked: 2020-08-27T21:33:25.607699\n",
550-
"Date last run: 2020-08-27\n",
551-
"UTC date now is: 2020-08-27\n",
552-
"\n",
553-
"Time checked: 2020-08-27T22:33:26.245749\n",
554-
"Date last run: 2020-08-27\n",
555-
"UTC date now is: 2020-08-27\n",
556-
"\n",
557-
"Time checked: 2020-08-27T23:33:26.893207\n",
558-
"Date last run: 2020-08-27\n",
559-
"UTC date now is: 2020-08-27\n",
560-
"\n",
561-
"Time checked: 2020-08-28T00:33:27.552136\n",
562-
"Date last run: 2020-08-27\n",
563-
"UTC date now is: 2020-08-28\n",
506+
"Time checked: 2020-11-06T03:15:18.788940\n",
507+
"Date last run: 2020-11-05\n",
508+
"UTC date now is: 2020-11-06\n",
564509
"Item counts (university-wide):\n",
565510
"vu_total\n",
566511
"vu_men\n",
@@ -569,23 +514,23 @@
569514
"vu_works\n",
570515
"vu_men_works\n",
571516
"vu_women_works\n",
572-
"{'commit': Commit(sha=\"158b18eed2c2505d69acd4ba982ad8e6690e0515\"), 'content': ContentFile(path=\"publications/data/vandycite_item_data.csv\")}\n",
517+
"{'commit': Commit(sha=\"2e57032bb9ffeffc364dd8e39b0def074d771de6\"), 'content': ContentFile(path=\"publications/data/vandycite_item_data.csv\")}\n",
573518
"\n",
574519
"Item counts by unit:\n",
575520
"units_total\n",
576-
"{'commit': Commit(sha=\"64f9885339e47c75d3743a7fab3dc7c342b056a1\"), 'content': ContentFile(path=\"publications/data/units_total.csv\")}\n",
521+
"{'commit': Commit(sha=\"eed46c0f71cf5c01f0514f026ecc60aae9359f73\"), 'content': ContentFile(path=\"publications/data/units_total.csv\")}\n",
577522
"units_women\n",
578-
"{'commit': Commit(sha=\"87ae9755e240307a262c8a1bcf88248fe45195df\"), 'content': ContentFile(path=\"publications/data/units_women.csv\")}\n",
523+
"{'commit': Commit(sha=\"e0a830292595d16fc70062d5496de3faa614e360\"), 'content': ContentFile(path=\"publications/data/units_women.csv\")}\n",
579524
"units_men\n",
580-
"{'commit': Commit(sha=\"8207a2c93699bdc5a6a966ef5f9e664253d157f7\"), 'content': ContentFile(path=\"publications/data/units_men.csv\")}\n",
525+
"{'commit': Commit(sha=\"050330cc3f4922e777addd2b62d83aeb3ba97c37\"), 'content': ContentFile(path=\"publications/data/units_men.csv\")}\n",
581526
"units_orcid\n",
582-
"{'commit': Commit(sha=\"2d0f304486b8b9144711606a251ca22e2e6b8df6\"), 'content': ContentFile(path=\"publications/data/units_orcid.csv\")}\n",
527+
"{'commit': Commit(sha=\"2433f14038ea256ad01d2a125e218aa3e5de60cb\"), 'content': ContentFile(path=\"publications/data/units_orcid.csv\")}\n",
583528
"units_works\n",
584-
"{'commit': Commit(sha=\"8188080a645155e24d04b83b0e0c190ba913d363\"), 'content': ContentFile(path=\"publications/data/units_works.csv\")}\n",
529+
"{'commit': Commit(sha=\"654dbe19490f36091c22a2113b28ea1ddd517915\"), 'content': ContentFile(path=\"publications/data/units_works.csv\")}\n",
585530
"units_works_men\n",
586-
"{'commit': Commit(sha=\"312a83c408b128968875aff54c864c7de7edb1ba\"), 'content': ContentFile(path=\"publications/data/units_works_men.csv\")}\n",
531+
"{'commit': Commit(sha=\"5ac8915da98f00a8ce20afa0c2807462ca318fa4\"), 'content': ContentFile(path=\"publications/data/units_works_men.csv\")}\n",
587532
"units_works_women\n",
588-
"{'commit': Commit(sha=\"37c6066f1ec9b3c0871680af1312485778c6b811\"), 'content': ContentFile(path=\"publications/data/units_works_women.csv\")}\n",
533+
"{'commit': Commit(sha=\"bf66bb23be7ff82a5db3bd21d8e195d2888caa47\"), 'content': ContentFile(path=\"publications/data/units_works_women.csv\")}\n",
589534
"\n",
590535
"Contributions\n",
591536
"Clifford_Anderson\n",
@@ -601,52 +546,80 @@
601546
"Charlotte_Y._Lew\n",
602547
"KukanaLuika\n",
603548
"VanderBot\n",
604-
"{'commit': Commit(sha=\"741ffda6a2ef03dfdfd85996257dd7392afa8ed8\"), 'content': ContentFile(path=\"publications/data/vandycite_edit_data.csv\")}\n",
549+
"{'commit': Commit(sha=\"a9c52d7a20a461f5adb53d5fa18dba8ef6df23e8\"), 'content': ContentFile(path=\"publications/data/vandycite_edit_data.csv\")}\n",
605550
"done\n",
606551
"\n",
607-
"Time checked: 2020-08-28T01:34:14.072478\n",
608-
"Date last run: 2020-08-28\n",
609-
"UTC date now is: 2020-08-28\n",
552+
"Time checked: 2020-11-06T04:19:10.748400\n",
553+
"Date last run: 2020-11-06\n",
554+
"UTC date now is: 2020-11-06\n",
610555
"\n",
611-
"Time checked: 2020-08-28T02:34:14.799416\n",
612-
"Date last run: 2020-08-28\n",
613-
"UTC date now is: 2020-08-28\n",
556+
"Time checked: 2020-11-06T05:19:11.180033\n",
557+
"Date last run: 2020-11-06\n",
558+
"UTC date now is: 2020-11-06\n",
614559
"\n",
615-
"Time checked: 2020-08-28T03:34:15.405621\n",
616-
"Date last run: 2020-08-28\n",
617-
"UTC date now is: 2020-08-28\n",
560+
"Time checked: 2020-11-06T06:19:11.990439\n",
561+
"Date last run: 2020-11-06\n",
562+
"UTC date now is: 2020-11-06\n",
618563
"\n",
619-
"Time checked: 2020-08-28T10:39:24.013756\n",
620-
"Date last run: 2020-08-28\n",
621-
"UTC date now is: 2020-08-28\n",
564+
"Time checked: 2020-11-06T07:19:12.513036\n",
565+
"Date last run: 2020-11-06\n",
566+
"UTC date now is: 2020-11-06\n",
622567
"\n",
623-
"Time checked: 2020-08-28T11:39:24.522399\n",
624-
"Date last run: 2020-08-28\n",
625-
"UTC date now is: 2020-08-28\n",
568+
"Time checked: 2020-11-06T08:19:12.948859\n",
569+
"Date last run: 2020-11-06\n",
570+
"UTC date now is: 2020-11-06\n",
626571
"\n",
627-
"Time checked: 2020-08-28T12:39:25.193728\n",
628-
"Date last run: 2020-08-28\n",
629-
"UTC date now is: 2020-08-28\n",
572+
"Time checked: 2020-11-06T09:19:13.860337\n",
573+
"Date last run: 2020-11-06\n",
574+
"UTC date now is: 2020-11-06\n",
630575
"\n",
631-
"Time checked: 2020-08-28T13:39:25.845848\n",
632-
"Date last run: 2020-08-28\n",
633-
"UTC date now is: 2020-08-28\n",
576+
"Time checked: 2020-11-06T10:19:14.225606\n",
577+
"Date last run: 2020-11-06\n",
578+
"UTC date now is: 2020-11-06\n",
634579
"\n",
635-
"Time checked: 2020-08-28T14:39:26.741993\n",
636-
"Date last run: 2020-08-28\n",
637-
"UTC date now is: 2020-08-28\n",
580+
"Time checked: 2020-11-06T11:19:14.591934\n",
581+
"Date last run: 2020-11-06\n",
582+
"UTC date now is: 2020-11-06\n",
638583
"\n",
639-
"Time checked: 2020-08-28T15:39:27.243755\n",
640-
"Date last run: 2020-08-28\n",
641-
"UTC date now is: 2020-08-28\n",
584+
"Time checked: 2020-11-06T12:19:15.446802\n",
585+
"Date last run: 2020-11-06\n",
586+
"UTC date now is: 2020-11-06\n",
642587
"\n",
643-
"Time checked: 2020-08-28T16:39:27.900316\n",
644-
"Date last run: 2020-08-28\n",
645-
"UTC date now is: 2020-08-28\n",
588+
"Time checked: 2020-11-06T13:19:15.850560\n",
589+
"Date last run: 2020-11-06\n",
590+
"UTC date now is: 2020-11-06\n",
646591
"\n",
647-
"Time checked: 2020-08-28T17:39:28.563831\n",
648-
"Date last run: 2020-08-28\n",
649-
"UTC date now is: 2020-08-28\n",
592+
"Time checked: 2020-11-06T14:19:16.272968\n",
593+
"Date last run: 2020-11-06\n",
594+
"UTC date now is: 2020-11-06\n",
595+
"\n",
596+
"Time checked: 2020-11-06T15:19:16.839250\n",
597+
"Date last run: 2020-11-06\n",
598+
"UTC date now is: 2020-11-06\n",
599+
"\n",
600+
"Time checked: 2020-11-06T16:19:17.245462\n",
601+
"Date last run: 2020-11-06\n",
602+
"UTC date now is: 2020-11-06\n",
603+
"\n",
604+
"Time checked: 2020-11-06T17:19:17.712122\n",
605+
"Date last run: 2020-11-06\n",
606+
"UTC date now is: 2020-11-06\n",
607+
"\n",
608+
"Time checked: 2020-11-06T18:19:18.132463\n",
609+
"Date last run: 2020-11-06\n",
610+
"UTC date now is: 2020-11-06\n",
611+
"\n",
612+
"Time checked: 2020-11-06T19:19:18.566989\n",
613+
"Date last run: 2020-11-06\n",
614+
"UTC date now is: 2020-11-06\n",
615+
"\n",
616+
"Time checked: 2020-11-06T20:19:18.974711\n",
617+
"Date last run: 2020-11-06\n",
618+
"UTC date now is: 2020-11-06\n",
619+
"\n",
620+
"Time checked: 2020-11-06T21:19:19.486808\n",
621+
"Date last run: 2020-11-06\n",
622+
"UTC date now is: 2020-11-06\n",
650623
"\n"
651624
]
652625
}
@@ -708,13 +681,6 @@
708681
" sleep(3600)"
709682
]
710683
},
711-
{
712-
"cell_type": "code",
713-
"execution_count": null,
714-
"metadata": {},
715-
"outputs": [],
716-
"source": []
717-
},
718684
{
719685
"cell_type": "code",
720686
"execution_count": null,
@@ -728,6 +694,18 @@
728694
"display_name": "Python 3",
729695
"language": "python",
730696
"name": "python3"
697+
},
698+
"language_info": {
699+
"codemirror_mode": {
700+
"name": "ipython",
701+
"version": 3
702+
},
703+
"file_extension": ".py",
704+
"mimetype": "text/x-python",
705+
"name": "python",
706+
"nbconvert_exporter": "python",
707+
"pygments_lexer": "ipython3",
708+
"version": "3.7.1"
731709
}
732710
},
733711
"nbformat": 4,

vanderbot/bluffton.csv

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,2 @@
1+
department,wikidataId,name,labelEn,alias,description,orcidStatementUuid,orcid,orcidReferenceHash,orcidReferenceValue_nodeId,orcidReferenceValue_val,orcidReferenceValue_prec,employerStatementUuid,employer,employerReferenceHash,employerReferenceSourceUrl,employerReferenceRetrieved_nodeId,employerReferenceRetrieved_val,employerReferenceRetrieved_prec,affiliationStatementUuid,affiliation,affiliationReferenceHash,affiliationReferenceSourceUrl,affiliationReferenceRetrieved_nodeId,affiliationReferenceRetrieved_val,affiliationReferenceRetrieved_prec,instanceOfUuid,instanceOf,sexOrGenderUuid,sexOrGenderQId,gender,degree,category,wikidataStatus,role
2+
,Q101242973,Paul Neufeld Weaver,Paul Neufeld Weaver,"[""Paul Weaver""]",education professor,,,,,,,B1C8035C-9734-42A3-8F13-E38DB782B7E5,Q886141,2c1963b96bde00545c55c48774c2aa8d09c47a97,https://www.bluffton.edu/catalog/officers/faculty.aspx,411d7f31-d6d4-4dde-b01c-d20eff6eec14,2020-11-06T00:00:00Z,11,,,,,,,,C54E865E-79C2-4B67-B7D1-9F357340D735,Q5,2BDAA90F-B0FF-4EDE-9963-3E771E00338B,Q6581097,,,,,

0 commit comments

Comments
 (0)