|
| 1 | +/* |
| 2 | +See LXL-3739 for more info. |
| 3 | +
|
| 4 | +URI for <label> obtained from location response header of "curl -I -o headers -s ${url}" |
| 5 | +where url="https://id.loc.gov/authorities/subjectheadings/label/<label>" |
| 6 | +
|
| 7 | +Manually edited (spelling mistakes etc): |
| 8 | +
|
| 9 | +Darkwawe (music) -> Darkwave (Music) (in pm14bfp71ldshtn) |
| 10 | +Taraab -> Taraab (Music) (in wt7bjpmf1s02t5n) |
| 11 | +Occational verse -> Occasional verse (in khw087h30db2179) |
| 12 | +Alternative histories (fiction) -> Alternative histories (Fiction) (in 0xbdhl4j3g28rlz) |
| 13 | +Straight-edge -> Straight-edge (Music) (in 42gkrt7n4r3cqv8) |
| 14 | +Indians Music -> Indians--Music (in 86lpwfvs37m8dj2) |
| 15 | +Minutes (records) -> Minutes (Records) (in 0xbfnmfj240rck1) |
| 16 | +
|
| 17 | +*/ |
| 18 | + |
| 19 | +import whelk.util.DocumentUtil |
| 20 | + |
| 21 | +LABEL_TO_URI = ["Action and adventure fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026217", |
| 22 | + "Administrative regulations" : "https://id.loc.gov/authorities/genreForms/gf2011026030", |
| 23 | + "Aeolian harp" : "https://id.loc.gov/authorities/subjects/sh85001245", |
| 24 | + "Allegories" : "https://id.loc.gov/authorities/childrensSubjects/sj2021051655", |
| 25 | + "Alternative histories (fiction)" : "https://id.loc.gov/authorities/genreForms/gf2014026220.html", |
| 26 | + "Arthurian romances" : "https://id.loc.gov/authorities/childrensSubjects/sj96006040", |
| 27 | + "Audiobooks" : "https://id.loc.gov/authorities/genreForms/gf2011026063", |
| 28 | + "Autobiographical fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026231", |
| 29 | + "Ballets" : "https://id.loc.gov/authorities/childrensSubjects/sj2021051575", |
| 30 | + "Bible fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026240", |
| 31 | + "Bible stories" : "https://id.loc.gov/authorities/childrensSubjects/sj2021050145", |
| 32 | + "Bibliographies" : "https://id.loc.gov/authorities/genreForms/gf2014026048", |
| 33 | + "Bildungsromans" : "https://id.loc.gov/authorities/genreForms/gf2014026243", |
| 34 | + "Biographical fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026246", |
| 35 | + "Bowing (Musical instruments)" : "https://id.loc.gov/authorities/subjects/sh2005003308", |
| 36 | + "Burlesques (Literature)" : "https://id.loc.gov/authorities/genreForms/gf2014026254", |
| 37 | + "By-laws" : "https://id.loc.gov/authorities/genreForms/gf2011026104", |
| 38 | + "Catalogues raisonnés" : "https://id.loc.gov/authorities/genreForms/gf2014026058", |
| 39 | + "Christian literature, Early" : "https://id.loc.gov/authorities/subjects/sh85025115", |
| 40 | + "Comics (Graphic works)" : "https://id.loc.gov/authorities/genreForms/gf2014026266", |
| 41 | + "Concerts" : "https://id.loc.gov/authorities/childrensSubjects/sj2021050694", |
| 42 | + "Cyberpunk fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026275", |
| 43 | + "Darkwawe (music)" : "https://id.loc.gov/authorities/genreForms/gf2014026759.html", |
| 44 | + "Detective and mystery fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026280", |
| 45 | + "Dialect fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026283", |
| 46 | + "Diary fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026286", |
| 47 | + "Domestic fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026295", |
| 48 | + "Double bass" : "https://id.loc.gov/authorities/childrensSubjects/sj2021060177", |
| 49 | + "Drama" : "https://id.loc.gov/authorities/childrensSubjects/sj96005303", |
| 50 | + "Dystopian fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026302", |
| 51 | + "Epic fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026309", |
| 52 | + "Epistolary fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026314", |
| 53 | + "Erotic fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026320", |
| 54 | + "Essays" : "https://id.loc.gov/authorities/childrensSubjects/sj2021050651", |
| 55 | + "Experimental fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026325", |
| 56 | + "Fables" : "https://id.loc.gov/authorities/childrensSubjects/sj2021050019", |
| 57 | + "Fairy tales" : "https://id.loc.gov/authorities/childrensSubjects/sj2021050020", |
| 58 | + "Fakebooks (Music)" : "https://id.loc.gov/authorities/genreForms/gf2014026798", |
| 59 | + "Fan fiction" : "https://id.loc.gov/authorities/childrensSubjects/sj2021061311", |
| 60 | + "Fantasy fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026333", |
| 61 | + "Flash fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026543", |
| 62 | + "Folk literature" : "https://id.loc.gov/authorities/childrensSubjects/sj2021055518", |
| 63 | + "Folk tales" : "https://id.loc.gov/authorities/genreForms/gf2014026344", |
| 64 | + "Frame stories" : "https://id.loc.gov/authorities/genreForms/gf2014026347", |
| 65 | + "Gay erotic fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026320", |
| 66 | + "Ghost stories" : "https://id.loc.gov/authorities/genreForms/gf2014026357", |
| 67 | + "Gothic fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026360", |
| 68 | + "Graphic novels" : "https://id.loc.gov/authorities/childrensSubjects/sj2021050898", |
| 69 | + "Guitar" : "https://id.loc.gov/authorities/childrensSubjects/sj2021052979", |
| 70 | + "Historical fiction" : "https://id.loc.gov/authorities/childrensSubjects/sj2021056047", |
| 71 | + "Horror fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026373", |
| 72 | + "Humor" : "https://id.loc.gov/authorities/childrensSubjects/sj2020050021", |
| 73 | + "Indians Music" : "https://id.loc.gov/authorities/subjects/sh85065058.html", |
| 74 | + "Legends" : "https://id.loc.gov/authorities/childrensSubjects/sj2021060180", |
| 75 | + "Library catalogs" : "https://id.loc.gov/authorities/genreForms/gf2015026003", |
| 76 | + "Literature" : "https://id.loc.gov/authorities/childrensSubjects/sj2021050024", |
| 77 | + "Magic realist fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026424", |
| 78 | + "Mass (Music)" : "https://id.loc.gov/authorities/subjects/sh85081852", |
| 79 | + "Masses" : "https://id.loc.gov/authorities/genreForms/gf2014026926", |
| 80 | + "Minutes (records)" : "https://id.loc.gov/authorities/genreForms/gf2014026128.html", |
| 81 | + "Motion pictures" : "https://id.loc.gov/authorities/childrensSubjects/sj2021051639", |
| 82 | + "National songs" : "https://id.loc.gov/authorities/childrensSubjects/sj2021058378", |
| 83 | + "Noir fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026452", |
| 84 | + "Nonfiction novels" : "https://id.loc.gov/authorities/genreForms/gf2014026454", |
| 85 | + "Novels" : "https://id.loc.gov/authorities/genreForms/gf2015026020", |
| 86 | + "Nursery rhymes" : "https://id.loc.gov/authorities/childrensSubjects/sj2021050023", |
| 87 | + "Occational verse" : "https://id.loc.gov/authorities/genreForms/gf2014026460.html", |
| 88 | + "Octets" : "https://id.loc.gov/authorities/subjects/sh85093983", |
| 89 | + "Odes" : "https://id.loc.gov/authorities/genreForms/gf2014026461", |
| 90 | + "Organ (Musical instrument)" : "https://id.loc.gov/authorities/childrensSubjects/sj2021058121", |
| 91 | + "Parodies (Literature)" : "https://id.loc.gov/authorities/genreForms/gf2014026470", |
| 92 | + "Picaresque fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026479", |
| 93 | + "Political fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026482", |
| 94 | + "Psychological fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026492", |
| 95 | + "Puns" : "https://id.loc.gov/authorities/genreForms/gf2014026157", |
| 96 | + "Recreational works" : "https://id.loc.gov/authorities/genreForms/gf2014026164", |
| 97 | + "Religious fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026502", |
| 98 | + "Reviews" : "https://id.loc.gov/authorities/genreForms/gf2014026168", |
| 99 | + "Robinsonades" : "https://id.loc.gov/authorities/genreForms/gf2014026514", |
| 100 | + "Romance fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026516", |
| 101 | + "Romance films" : "https://id.loc.gov/authorities/genreForms/gf2011026543", |
| 102 | + "Romances" : "https://id.loc.gov/authorities/genreForms/gf2014026517", |
| 103 | + "Romans à clef" : "https://id.loc.gov/authorities/genreForms/gf2014026518", |
| 104 | + "Romantic comedy films" : "https://id.loc.gov/authorities/genreForms/gf2011026545", |
| 105 | + "Sagas" : "https://id.loc.gov/authorities/childrensSubjects/sj2021058029", |
| 106 | + "Satirical literature" : "https://id.loc.gov/authorities/genreForms/gf2014026525", |
| 107 | + "Science fiction" : "https://id.loc.gov/authorities/childrensSubjects/sj2021050042", |
| 108 | + "Sentimental novels" : "https://id.loc.gov/authorities/genreForms/gf2014026536", |
| 109 | + "Serialized fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026537", |
| 110 | + "Short stories" : "https://id.loc.gov/authorities/childrensSubjects/sj98000354", |
| 111 | + "Space operas" : "https://id.loc.gov/authorities/genreForms/gf2014026551", |
| 112 | + "Sprechstimme" : "https://id.loc.gov/authorities/subjects/sh2008000832", |
| 113 | + "Steampunk fiction" : "https://id.loc.gov/authorities/childrensSubjects/sj2021061324", |
| 114 | + "Stories in rhyme" : "https://id.loc.gov/authorities/childrensSubjects/sj2021050017", |
| 115 | + "Straight-edge" : "https://id.loc.gov/authorities/subjects/sh2003002058.html", |
| 116 | + "Strathspeys" : "https://id.loc.gov/authorities/subjects/sh85128520", |
| 117 | + "String octets" : "https://id.loc.gov/authorities/subjects/sh85129020", |
| 118 | + "Swamp pop music" : "https://id.loc.gov/authorities/genreForms/gf2014027118", |
| 119 | + "Symphonic poems" : "https://id.loc.gov/authorities/genreForms/gf2014027120", |
| 120 | + "Taarab" : "https://id.loc.gov/authorities/genreForms/gf2014027123.html", |
| 121 | + "Talking books" : "https://id.loc.gov/authorities/childrensSubjects/sj2021057301", |
| 122 | + "Tall tales" : "https://id.loc.gov/authorities/childrensSubjects/sj2021051578", |
| 123 | + "Tango" : "https://id.loc.gov/authorities/names/n96122416", |
| 124 | + "Te Deum laudamus" : "https://id.loc.gov/resources/hubs/46c964fa-238c-5179-795b-b8975adb8a34", |
| 125 | + "Thrillers (Fiction)" : "https://id.loc.gov/authorities/genreForms/gf2014026571", |
| 126 | + "Ukulele" : "https://id.loc.gov/authorities/childrensSubjects/sj2021053032", |
| 127 | + "Utopian fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026583", |
| 128 | + "Violoncello" : "https://id.loc.gov/authorities/names/n42026083", |
| 129 | + "War fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026590", |
| 130 | + "Western fiction" : "https://id.loc.gov/authorities/genreForms/gf2014026594", |
| 131 | + "Woodwind quartets (Saxophones (4))": "https://id.loc.gov/authorities/subjects/sh85147995"] |
| 132 | + |
| 133 | +selectByCollection('auth') { auth -> |
| 134 | + def data = auth.doc.data |
| 135 | + if (!data['@graph'][1].inScheme?.'@id'?.equals("https://id.kb.se/term/saogf")) { |
| 136 | + return |
| 137 | + } |
| 138 | + DocumentUtil.traverse(auth.doc.data, { value, path -> |
| 139 | + if (value instanceof Map && value.inScheme?.'@id'?.equals("https://id.kb.se/term/lcsh") && value.prefLabel) { |
| 140 | + incrementStats(value.prefLabel, path) |
| 141 | + auth.scheduleSave() |
| 142 | + return new DocumentUtil.Replace(['@id': LABEL_TO_URI[value.prefLabel]]) |
| 143 | + } |
| 144 | + }) |
| 145 | +} |
0 commit comments