@internetarchive/collection-browser 2.8.1-alpha-webdev7002.3 → 2.9.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,11 +1,27 @@
1
- const TEXTS = { facets: [{ facetType: 'mediatype', bucketKey: 'texts' }] };
2
- const AUDIO = { facets: [{ facetType: 'mediatype', bucketKey: 'audio' }] };
3
- const MOVIES = { facets: [{ facetType: 'mediatype', bucketKey: 'movies' }] };
4
- const IMAGE = { facets: [{ facetType: 'mediatype', bucketKey: 'image' }] };
5
- const SOFTWARE = { facets: [{ facetType: 'mediatype', bucketKey: 'software' }] };
6
- const ETREE = { facets: [{ facetType: 'mediatype', bucketKey: 'etree' }] };
7
- const WEB = { facets: [{ facetType: 'mediatype', bucketKey: 'web' }] };
8
- const DATA = { facets: [{ facetType: 'mediatype', bucketKey: 'data' }] };
1
+ const TEXTS = {
2
+ facets: [{ facetType: 'mediatype', bucketKey: 'texts' }],
3
+ };
4
+ const AUDIO = {
5
+ facets: [{ facetType: 'mediatype', bucketKey: 'audio' }],
6
+ };
7
+ const MOVIES = {
8
+ facets: [{ facetType: 'mediatype', bucketKey: 'movies' }],
9
+ };
10
+ const IMAGE = {
11
+ facets: [{ facetType: 'mediatype', bucketKey: 'image' }],
12
+ };
13
+ const SOFTWARE = {
14
+ facets: [{ facetType: 'mediatype', bucketKey: 'software' }],
15
+ };
16
+ const ETREE = {
17
+ facets: [{ facetType: 'mediatype', bucketKey: 'etree' }],
18
+ };
19
+ const WEB = {
20
+ facets: [{ facetType: 'mediatype', bucketKey: 'web' }],
21
+ };
22
+ const DATA = {
23
+ facets: [{ facetType: 'mediatype', bucketKey: 'data' }],
24
+ };
9
25
  /**
10
26
  * Map from keywords found in the search query to an array of
11
27
  * likely-relevant "smart facets" for those keywords.
@@ -1 +1 @@
1
- {"version":3,"file":"query-keywords-map.js","sourceRoot":"","sources":["../../../../../../src/collection-facets/smart-facets/heuristics/query-keywords/query-keywords-map.ts"],"names":[],"mappings":"AAEA,MAAM,KAAK,GAAe,EAAE,MAAM,EAAE,CAAC,EAAE,SAAS,EAAE,WAAW,EAAE,SAAS,EAAE,OAAO,EAAE,CAAC,EAAE,CAAC;AACvF,MAAM,KAAK,GAAe,EAAE,MAAM,EAAE,CAAC,EAAE,SAAS,EAAE,WAAW,EAAE,SAAS,EAAE,OAAO,EAAE,CAAC,EAAE,CAAC;AACvF,MAAM,MAAM,GAAe,EAAE,MAAM,EAAE,CAAC,EAAE,SAAS,EAAE,WAAW,EAAE,SAAS,EAAE,QAAQ,EAAE,CAAC,EAAE,CAAC;AACzF,MAAM,KAAK,GAAe,EAAE,MAAM,EAAE,CAAC,EAAE,SAAS,EAAE,WAAW,EAAE,SAAS,EAAE,OAAO,EAAE,CAAC,EAAE,CAAC;AACvF,MAAM,QAAQ,GAAe,EAAE,MAAM,EAAE,CAAC,EAAE,SAAS,EAAE,WAAW,EAAE,SAAS,EAAE,UAAU,EAAE,CAAC,EAAE,CAAC;AAC7F,MAAM,KAAK,GAAe,EAAE,MAAM,EAAE,CAAC,EAAE,SAAS,EAAE,WAAW,EAAE,SAAS,EAAE,OAAO,EAAE,CAAC,EAAE,CAAC;AACvF,MAAM,GAAG,GAAe,EAAE,MAAM,EAAE,CAAC,EAAE,SAAS,EAAE,WAAW,EAAE,SAAS,EAAE,KAAK,EAAE,CAAC,EAAE,CAAC;AACnF,MAAM,IAAI,GAAe,EAAE,MAAM,EAAE,CAAC,EAAE,SAAS,EAAE,WAAW,EAAE,SAAS,EAAE,MAAM,EAAE,CAAC,EAAE,CAAC;AAErF;;;GAGG;AACH,MAAM,CAAC,MAAM,cAAc,GAA8B;IACvD,IAAI,EAAE,CAAC,KAAK,CAAC;IACb,IAAI,EAAE,CAAC,KAAK,CAAC;IACb,KAAK,EAAE,CAAC,KAAK,CAAC;IACd,QAAQ,EAAE,CAAC,KAAK,CAAC;IACjB,SAAS,EAAE,CAAC,KAAK,CAAC;IAClB,GAAG,EAAE,CAAC,KAAK,CAAC;IACZ,IAAI,EAAE,CAAC,KAAK,CAAC;IACb,KAAK,EAAE,CAAC,KAAK,CAAC;IACd,IAAI,EAAE,CAAC,KAAK,CAAC;IACb,KAAK,EAAE,CAAC,KAAK,CAAC;IACd,MAAM,EAAE,CAAC,KAAK,CAAC;IACf,OAAO,EAAE,CAAC,KAAK,CAAC;IAChB,KAAK,EAAE,CAAC,KAAK,CAAC;IACd,MAAM,EAAE,CAAC,KAAK,EAAE,MAAM,CAAC;IACvB,KAAK,EAAE,CAAC,MAAM,CAAC;IACf,KAAK,EAAE,CAAC,MAAM,CAAC;IACf,IAAI,EAAE,CAAC,MAAM,CAAC;IACd,SAAS,EAAE,CAAC,MAAM,CAAC;IACnB,OAAO,EAAE,CAAC,MAAM,CAAC;IACjB,KAAK,EAAE,CAAC,KAAK,CAAC;IACd,KAAK,EAAE,CAAC,KAAK,CAAC;IACd,OAAO,EAAE,CAAC,KAAK,CAAC;IAChB,QAAQ,EAAE,CAAC,KAAK,CAAC;IACjB,GAAG,EAAE,CAAC,KAAK,CAAC;IACZ,IAAI,EAAE,CAAC,KAAK,CAAC;IACb,GAAG,EAAE,CAAC,KAAK,CAAC;IACZ,GAAG,EAAE,CAAC,KAAK,CAAC;IACZ,QAAQ,EAAE,CAAC,QAAQ,CAAC;IACpB,GAAG,EAAE,CAAC,QAAQ,CAAC;IACf,OAAO,EAAE,CAAC,QAAQ,CAAC;IACnB,IAAI,EAAE,CAAC,QAAQ,CAAC;IAChB,MAAM,EAAE,CAAC,QAAQ,CAAC;IAClB,KAAK,EAAE,CAAC,KAAK,CAAC;IACd,OAAO,EAAE,CAAC,KAAK,CAAC;IAChB,YAAY,EAAE,CAAC,KAAK,CAAC;IACrB,WAAW,EAAE,CAAC,GAAG,CAAC;IAClB,OAAO,EAAE,CAAC,IAAI,CAAC;CAChB,CAAC","sourcesContent":["import type { KeywordFacetMap, SmartFacet } from '../../models';\n\nconst TEXTS: SmartFacet = { facets: [{ facetType: 'mediatype', bucketKey: 'texts' }] };\nconst AUDIO: SmartFacet = { facets: [{ facetType: 'mediatype', bucketKey: 'audio' }] };\nconst MOVIES: SmartFacet = { facets: [{ facetType: 'mediatype', bucketKey: 'movies' }] };\nconst IMAGE: SmartFacet = { facets: [{ facetType: 'mediatype', bucketKey: 'image' }] };\nconst SOFTWARE: SmartFacet = { facets: [{ facetType: 'mediatype', bucketKey: 'software' }] };\nconst ETREE: SmartFacet = { facets: [{ facetType: 'mediatype', bucketKey: 'etree' }] };\nconst WEB: SmartFacet = { facets: [{ facetType: 'mediatype', bucketKey: 'web' }] };\nconst DATA: SmartFacet = { facets: [{ facetType: 'mediatype', bucketKey: 'data' }] };\n\n/**\n * Map from keywords found in the search query to an array of\n * likely-relevant \"smart facets\" for those keywords.\n */\nexport const QUERY_KEYWORDS: Readonly<KeywordFacetMap> = {\n text: [TEXTS],\n book: [TEXTS],\n novel: [TEXTS],\n magazine: [TEXTS],\n newspaper: [TEXTS],\n pdf: [TEXTS],\n epub: [TEXTS],\n audio: [AUDIO],\n song: [AUDIO],\n music: [AUDIO],\n listen: [AUDIO],\n podcast: [AUDIO],\n radio: [AUDIO],\n stream: [AUDIO, MOVIES],\n video: [MOVIES],\n movie: [MOVIES],\n film: [MOVIES],\n animation: [MOVIES],\n youtube: [MOVIES],\n image: [IMAGE],\n photo: [IMAGE],\n picture: [IMAGE],\n painting: [IMAGE],\n jpg: [IMAGE],\n jpeg: [IMAGE],\n png: [IMAGE],\n gif: [IMAGE],\n software: [SOFTWARE],\n app: [SOFTWARE],\n program: [SOFTWARE],\n game: [SOFTWARE],\n arcade: [SOFTWARE],\n etree: [ETREE],\n concert: [ETREE],\n 'live music': [ETREE],\n 'web crawl': [WEB],\n dataset: [DATA],\n};\n"]}
1
+ {"version":3,"file":"query-keywords-map.js","sourceRoot":"","sources":["../../../../../../src/collection-facets/smart-facets/heuristics/query-keywords/query-keywords-map.ts"],"names":[],"mappings":"AAEA,MAAM,KAAK,GAAe;IACxB,MAAM,EAAE,CAAC,EAAE,SAAS,EAAE,WAAW,EAAE,SAAS,EAAE,OAAO,EAAE,CAAC;CACzD,CAAC;AACF,MAAM,KAAK,GAAe;IACxB,MAAM,EAAE,CAAC,EAAE,SAAS,EAAE,WAAW,EAAE,SAAS,EAAE,OAAO,EAAE,CAAC;CACzD,CAAC;AACF,MAAM,MAAM,GAAe;IACzB,MAAM,EAAE,CAAC,EAAE,SAAS,EAAE,WAAW,EAAE,SAAS,EAAE,QAAQ,EAAE,CAAC;CAC1D,CAAC;AACF,MAAM,KAAK,GAAe;IACxB,MAAM,EAAE,CAAC,EAAE,SAAS,EAAE,WAAW,EAAE,SAAS,EAAE,OAAO,EAAE,CAAC;CACzD,CAAC;AACF,MAAM,QAAQ,GAAe;IAC3B,MAAM,EAAE,CAAC,EAAE,SAAS,EAAE,WAAW,EAAE,SAAS,EAAE,UAAU,EAAE,CAAC;CAC5D,CAAC;AACF,MAAM,KAAK,GAAe;IACxB,MAAM,EAAE,CAAC,EAAE,SAAS,EAAE,WAAW,EAAE,SAAS,EAAE,OAAO,EAAE,CAAC;CACzD,CAAC;AACF,MAAM,GAAG,GAAe;IACtB,MAAM,EAAE,CAAC,EAAE,SAAS,EAAE,WAAW,EAAE,SAAS,EAAE,KAAK,EAAE,CAAC;CACvD,CAAC;AACF,MAAM,IAAI,GAAe;IACvB,MAAM,EAAE,CAAC,EAAE,SAAS,EAAE,WAAW,EAAE,SAAS,EAAE,MAAM,EAAE,CAAC;CACxD,CAAC;AAEF;;;GAGG;AACH,MAAM,CAAC,MAAM,cAAc,GAA8B;IACvD,IAAI,EAAE,CAAC,KAAK,CAAC;IACb,IAAI,EAAE,CAAC,KAAK,CAAC;IACb,KAAK,EAAE,CAAC,KAAK,CAAC;IACd,QAAQ,EAAE,CAAC,KAAK,CAAC;IACjB,SAAS,EAAE,CAAC,KAAK,CAAC;IAClB,GAAG,EAAE,CAAC,KAAK,CAAC;IACZ,IAAI,EAAE,CAAC,KAAK,CAAC;IACb,KAAK,EAAE,CAAC,KAAK,CAAC;IACd,IAAI,EAAE,CAAC,KAAK,CAAC;IACb,KAAK,EAAE,CAAC,KAAK,CAAC;IACd,MAAM,EAAE,CAAC,KAAK,CAAC;IACf,OAAO,EAAE,CAAC,KAAK,CAAC;IAChB,KAAK,EAAE,CAAC,KAAK,CAAC;IACd,MAAM,EAAE,CAAC,KAAK,EAAE,MAAM,CAAC;IACvB,KAAK,EAAE,CAAC,MAAM,CAAC;IACf,KAAK,EAAE,CAAC,MAAM,CAAC;IACf,IAAI,EAAE,CAAC,MAAM,CAAC;IACd,SAAS,EAAE,CAAC,MAAM,CAAC;IACnB,OAAO,EAAE,CAAC,MAAM,CAAC;IACjB,KAAK,EAAE,CAAC,KAAK,CAAC;IACd,KAAK,EAAE,CAAC,KAAK,CAAC;IACd,OAAO,EAAE,CAAC,KAAK,CAAC;IAChB,QAAQ,EAAE,CAAC,KAAK,CAAC;IACjB,GAAG,EAAE,CAAC,KAAK,CAAC;IACZ,IAAI,EAAE,CAAC,KAAK,CAAC;IACb,GAAG,EAAE,CAAC,KAAK,CAAC;IACZ,GAAG,EAAE,CAAC,KAAK,CAAC;IACZ,QAAQ,EAAE,CAAC,QAAQ,CAAC;IACpB,GAAG,EAAE,CAAC,QAAQ,CAAC;IACf,OAAO,EAAE,CAAC,QAAQ,CAAC;IACnB,IAAI,EAAE,CAAC,QAAQ,CAAC;IAChB,MAAM,EAAE,CAAC,QAAQ,CAAC;IAClB,KAAK,EAAE,CAAC,KAAK,CAAC;IACd,OAAO,EAAE,CAAC,KAAK,CAAC;IAChB,YAAY,EAAE,CAAC,KAAK,CAAC;IACrB,WAAW,EAAE,CAAC,GAAG,CAAC;IAClB,OAAO,EAAE,CAAC,IAAI,CAAC;CAChB,CAAC","sourcesContent":["import type { KeywordFacetMap, SmartFacet } from '../../models';\n\nconst TEXTS: SmartFacet = {\n facets: [{ facetType: 'mediatype', bucketKey: 'texts' }],\n};\nconst AUDIO: SmartFacet = {\n facets: [{ facetType: 'mediatype', bucketKey: 'audio' }],\n};\nconst MOVIES: SmartFacet = {\n facets: [{ facetType: 'mediatype', bucketKey: 'movies' }],\n};\nconst IMAGE: SmartFacet = {\n facets: [{ facetType: 'mediatype', bucketKey: 'image' }],\n};\nconst SOFTWARE: SmartFacet = {\n facets: [{ facetType: 'mediatype', bucketKey: 'software' }],\n};\nconst ETREE: SmartFacet = {\n facets: [{ facetType: 'mediatype', bucketKey: 'etree' }],\n};\nconst WEB: SmartFacet = {\n facets: [{ facetType: 'mediatype', bucketKey: 'web' }],\n};\nconst DATA: SmartFacet = {\n facets: [{ facetType: 'mediatype', bucketKey: 'data' }],\n};\n\n/**\n * Map from keywords found in the search query to an array of\n * likely-relevant \"smart facets\" for those keywords.\n */\nexport const QUERY_KEYWORDS: Readonly<KeywordFacetMap> = {\n text: [TEXTS],\n book: [TEXTS],\n novel: [TEXTS],\n magazine: [TEXTS],\n newspaper: [TEXTS],\n pdf: [TEXTS],\n epub: [TEXTS],\n audio: [AUDIO],\n song: [AUDIO],\n music: [AUDIO],\n listen: [AUDIO],\n podcast: [AUDIO],\n radio: [AUDIO],\n stream: [AUDIO, MOVIES],\n video: [MOVIES],\n movie: [MOVIES],\n film: [MOVIES],\n animation: [MOVIES],\n youtube: [MOVIES],\n image: [IMAGE],\n photo: [IMAGE],\n picture: [IMAGE],\n painting: [IMAGE],\n jpg: [IMAGE],\n jpeg: [IMAGE],\n png: [IMAGE],\n gif: [IMAGE],\n software: [SOFTWARE],\n app: [SOFTWARE],\n program: [SOFTWARE],\n game: [SOFTWARE],\n arcade: [SOFTWARE],\n etree: [ETREE],\n concert: [ETREE],\n 'live music': [ETREE],\n 'web crawl': [WEB],\n dataset: [DATA],\n};\n"]}
@@ -52,24 +52,18 @@ export class WikidataHeuristic {
52
52
  * @inheritdoc
53
53
  */
54
54
  async getRecommendedFacets(query) {
55
- var _a, _b, _c;
55
+ var _a;
56
56
  const recommendations = [];
57
57
  try {
58
58
  const wikidataURL = this.getWikidataURL(query);
59
59
  const wikidataResponse = await fetch(wikidataURL);
60
60
  const searchResults = await wikidataResponse.json();
61
- console.log('wikidata results', searchResults);
62
61
  for (const [keyword, facets] of Object.entries(WIKIDATA_ENTITIES)) {
63
- console.log('testing keyword', keyword);
64
62
  const keywordRegex = new RegExp(`\\b${keyword}\\b`);
65
- console.log('regex', keywordRegex);
66
- console.log('description', (_a = searchResults.search[0]) === null || _a === void 0 ? void 0 : _a.description);
67
- console.log('test', keywordRegex.test((_b = searchResults.search[0]) === null || _b === void 0 ? void 0 : _b.description));
68
- if (keywordRegex.test((_c = searchResults.search[0]) === null || _c === void 0 ? void 0 : _c.description)) {
63
+ if (keywordRegex.test((_a = searchResults.search[0]) === null || _a === void 0 ? void 0 : _a.description)) {
69
64
  const entityName = searchResults.search[0].label;
70
65
  recommendations.push(...this.replaceQueryPlaceholders(facets, entityName));
71
66
  }
72
- console.log('recs', recommendations);
73
67
  }
74
68
  return recommendations;
75
69
  }
@@ -1 +1 @@
1
- {"version":3,"file":"wikidata-heuristic.js","sourceRoot":"","sources":["../../../../../../src/collection-facets/smart-facets/heuristics/wikidata/wikidata-heuristic.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,iBAAiB,EAAE,MAAM,uBAAuB,CAAC;AAE1D,4EAA4E;AAC5E,mBAAmB;AACnB,0BAA0B;AAC1B,2BAA2B;AAC3B,8CAA8C;AAC9C,+CAA+C;AAC/C,8CAA8C;AAC9C,8CAA8C;AAC9C,OAAO;AACP,MAAM,OAAO,iBAAiB;IAA9B;QACmB,sBAAiB,GAAG,oCAAoC,CAAC;QAEzD,0BAAqB,GACpC,wFAAwF,CAAC;IA+E7F,CAAC;IA7EC;;;OAGG;IACK,cAAc,CAAC,KAAa;QAClC,MAAM,QAAQ,GAAG,kBAAkB,CAAC,KAAK,CAAC,CAAC;QAC3C,OAAO,GAAG,IAAI,CAAC,iBAAiB,GAAG,IAAI,CAAC,qBAAqB,WAAW,QAAQ,EAAE,CAAC;IACrF,CAAC;IAED;;;;;OAKG;IACK,wBAAwB,CAC9B,WAAyB,EACzB,KAAa;QAEb,OAAO,WAAW,CAAC,GAAG,CACpB,UAAU,CAAC,EAAE;;YACX,OAAA,CAAC;gBACC,oDAAoD;gBACpD,KAAK,EAAE,MAAA,UAAU,CAAC,KAAK,0CAAE,OAAO,CAAC,SAAS,EAAE,KAAK,CAAC;gBAClD,6EAA6E;gBAC7E,MAAM,EAAE,UAAU,CAAC,MAAM,CAAC,GAAG,CAAC,KAAK,CAAC,EAAE;;oBACpC,MAAM,QAAQ,GAAG;wBACf,GAAG,KAAK;wBACR,SAAS,EAAE,KAAK,CAAC,SAAS,CAAC,OAAO,CAAC,SAAS,EAAE,KAAK,CAAC;qBACrD,CAAC;oBAEF,IAAI,KAAK,CAAC,WAAW,EAAE,CAAC;wBACtB,QAAQ,CAAC,WAAW,GAAG,MAAA,QAAQ,CAAC,WAAW,0CAAE,OAAO,CAClD,SAAS,EACT,KAAK,CACN,CAAC;oBACJ,CAAC;oBAED,OAAO,QAAQ,CAAC;gBAClB,CAAC,CAAC;aACH,CAAe,CAAA;SAAA,CACnB,CAAC;IACJ,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,oBAAoB,CAAC,KAAa;;QACtC,MAAM,eAAe,GAAiB,EAAE,CAAC;QAEzC,IAAI,CAAC;YACH,MAAM,WAAW,GAAG,IAAI,CAAC,cAAc,CAAC,KAAK,CAAC,CAAC;YAC/C,MAAM,gBAAgB,GAAG,MAAM,KAAK,CAAC,WAAW,CAAC,CAAC;YAClD,MAAM,aAAa,GAAG,MAAM,gBAAgB,CAAC,IAAI,EAAE,CAAC;YACpD,OAAO,CAAC,GAAG,CAAC,kBAAkB,EAAE,aAAa,CAAC,CAAC;YAE/C,KAAK,MAAM,CAAC,OAAO,EAAE,MAAM,CAAC,IAAI,MAAM,CAAC,OAAO,CAAC,iBAAiB,CAAC,EAAE,CAAC;gBAClE,OAAO,CAAC,GAAG,CAAC,iBAAiB,EAAE,OAAO,CAAC,CAAC;gBACxC,MAAM,YAAY,GAAG,IAAI,MAAM,CAAC,MAAM,OAAO,KAAK,CAAC,CAAC;gBACpD,OAAO,CAAC,GAAG,CAAC,OAAO,EAAE,YAAY,CAAC,CAAC;gBACnC,OAAO,CAAC,GAAG,CAAC,aAAa,EAAE,MAAA,aAAa,CAAC,MAAM,CAAC,CAAC,CAAC,0CAAE,WAAW,CAAC,CAAC;gBACjE,OAAO,CAAC,GAAG,CAAC,MAAM,EAAE,YAAY,CAAC,IAAI,CAAC,MAAA,aAAa,CAAC,MAAM,CAAC,CAAC,CAAC,0CAAE,WAAW,CAAC,CAAC,CAAC;gBAC7E,IAAI,YAAY,CAAC,IAAI,CAAC,MAAA,aAAa,CAAC,MAAM,CAAC,CAAC,CAAC,0CAAE,WAAW,CAAC,EAAE,CAAC;oBAC5D,MAAM,UAAU,GAAG,aAAa,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,KAAK,CAAC;oBACjD,eAAe,CAAC,IAAI,CAClB,GAAG,IAAI,CAAC,wBAAwB,CAAC,MAAM,EAAE,UAAU,CAAC,CACrD,CAAC;gBACJ,CAAC;gBACD,OAAO,CAAC,GAAG,CAAC,MAAM,EAAE,eAAe,CAAC,CAAC;YACvC,CAAC;YAED,OAAO,eAAe,CAAC;QACzB,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACb,OAAO,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;YAClB,OAAO,EAAE,CAAC;QACZ,CAAC;IACH,CAAC;CACF","sourcesContent":["import type { SmartQueryHeuristic, SmartFacet } from '../../models';\nimport { WIKIDATA_ENTITIES } from './wikidata-entity-map';\n\n// If wikidata describes the top query result as X, recommend facet Y, e.g.:\n// X Y\n// written work mt:texts\n// film mt:movies\n// author mt:texts and creator:<query>\n// filmmaker mt:movies and creator:<query>\n// photographer mt:image and creator:<query>\n// visual artist mt:image and creator:<query>\n// etc.\nexport class WikidataHeuristic implements SmartQueryHeuristic {\n private readonly WIKIDATA_BASE_URL = 'https://www.wikidata.org/w/api.php';\n\n private readonly WIKIDATA_DEFAULT_ARGS =\n '?action=wbsearchentities&format=json&language=en&uselang=en&origin=*&type=item&limit=5';\n\n /**\n * Returns the full URL for a Wikidata search for the given query\n * @param query The query to search for\n */\n private getWikidataURL(query: string): string {\n const urlQuery = encodeURIComponent(query);\n return `${this.WIKIDATA_BASE_URL}${this.WIKIDATA_DEFAULT_ARGS}&search=${urlQuery}`;\n }\n\n /**\n * Replaces query placeholders with an actual query string, within a collection of smart facets\n * @param smartFacets The array of smart facets\n * @param query The query string to replace placeholders with\n * @returns A new array of smart facets with all query placeholders replaced\n */\n private replaceQueryPlaceholders(\n smartFacets: SmartFacet[],\n query: string,\n ): SmartFacet[] {\n return smartFacets.map(\n smartFacet =>\n ({\n // Replace placeholders within the smart facet label\n label: smartFacet.label?.replace('__QUERY', query),\n // Replace placeholders within the facets themselves (buckets & display text)\n facets: smartFacet.facets.map(facet => {\n const replaced = {\n ...facet,\n bucketKey: facet.bucketKey.replace('__QUERY', query),\n };\n\n if (facet.displayText) {\n replaced.displayText = replaced.displayText?.replace(\n '__QUERY',\n query,\n );\n }\n\n return replaced;\n }),\n }) as SmartFacet,\n );\n }\n\n /**\n * @inheritdoc\n */\n async getRecommendedFacets(query: string): Promise<SmartFacet[]> {\n const recommendations: SmartFacet[] = [];\n\n try {\n const wikidataURL = this.getWikidataURL(query);\n const wikidataResponse = await fetch(wikidataURL);\n const searchResults = await wikidataResponse.json();\n console.log('wikidata results', searchResults);\n\n for (const [keyword, facets] of Object.entries(WIKIDATA_ENTITIES)) {\n console.log('testing keyword', keyword);\n const keywordRegex = new RegExp(`\\\\b${keyword}\\\\b`);\n console.log('regex', keywordRegex);\n console.log('description', searchResults.search[0]?.description);\n console.log('test', keywordRegex.test(searchResults.search[0]?.description));\n if (keywordRegex.test(searchResults.search[0]?.description)) {\n const entityName = searchResults.search[0].label;\n recommendations.push(\n ...this.replaceQueryPlaceholders(facets, entityName),\n );\n }\n console.log('recs', recommendations);\n }\n\n return recommendations;\n } catch (err) {\n console.warn(err);\n return [];\n }\n }\n}\n"]}
1
+ {"version":3,"file":"wikidata-heuristic.js","sourceRoot":"","sources":["../../../../../../src/collection-facets/smart-facets/heuristics/wikidata/wikidata-heuristic.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,iBAAiB,EAAE,MAAM,uBAAuB,CAAC;AAE1D,4EAA4E;AAC5E,mBAAmB;AACnB,0BAA0B;AAC1B,2BAA2B;AAC3B,8CAA8C;AAC9C,+CAA+C;AAC/C,8CAA8C;AAC9C,8CAA8C;AAC9C,OAAO;AACP,MAAM,OAAO,iBAAiB;IAA9B;QACmB,sBAAiB,GAAG,oCAAoC,CAAC;QAEzD,0BAAqB,GACpC,wFAAwF,CAAC;IAyE7F,CAAC;IAvEC;;;OAGG;IACK,cAAc,CAAC,KAAa;QAClC,MAAM,QAAQ,GAAG,kBAAkB,CAAC,KAAK,CAAC,CAAC;QAC3C,OAAO,GAAG,IAAI,CAAC,iBAAiB,GAAG,IAAI,CAAC,qBAAqB,WAAW,QAAQ,EAAE,CAAC;IACrF,CAAC;IAED;;;;;OAKG;IACK,wBAAwB,CAC9B,WAAyB,EACzB,KAAa;QAEb,OAAO,WAAW,CAAC,GAAG,CACpB,UAAU,CAAC,EAAE;;YACX,OAAA,CAAC;gBACC,oDAAoD;gBACpD,KAAK,EAAE,MAAA,UAAU,CAAC,KAAK,0CAAE,OAAO,CAAC,SAAS,EAAE,KAAK,CAAC;gBAClD,6EAA6E;gBAC7E,MAAM,EAAE,UAAU,CAAC,MAAM,CAAC,GAAG,CAAC,KAAK,CAAC,EAAE;;oBACpC,MAAM,QAAQ,GAAG;wBACf,GAAG,KAAK;wBACR,SAAS,EAAE,KAAK,CAAC,SAAS,CAAC,OAAO,CAAC,SAAS,EAAE,KAAK,CAAC;qBACrD,CAAC;oBAEF,IAAI,KAAK,CAAC,WAAW,EAAE,CAAC;wBACtB,QAAQ,CAAC,WAAW,GAAG,MAAA,QAAQ,CAAC,WAAW,0CAAE,OAAO,CAClD,SAAS,EACT,KAAK,CACN,CAAC;oBACJ,CAAC;oBAED,OAAO,QAAQ,CAAC;gBAClB,CAAC,CAAC;aACH,CAAe,CAAA;SAAA,CACnB,CAAC;IACJ,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,oBAAoB,CAAC,KAAa;;QACtC,MAAM,eAAe,GAAiB,EAAE,CAAC;QAEzC,IAAI,CAAC;YACH,MAAM,WAAW,GAAG,IAAI,CAAC,cAAc,CAAC,KAAK,CAAC,CAAC;YAC/C,MAAM,gBAAgB,GAAG,MAAM,KAAK,CAAC,WAAW,CAAC,CAAC;YAClD,MAAM,aAAa,GAAG,MAAM,gBAAgB,CAAC,IAAI,EAAE,CAAC;YAEpD,KAAK,MAAM,CAAC,OAAO,EAAE,MAAM,CAAC,IAAI,MAAM,CAAC,OAAO,CAAC,iBAAiB,CAAC,EAAE,CAAC;gBAClE,MAAM,YAAY,GAAG,IAAI,MAAM,CAAC,MAAM,OAAO,KAAK,CAAC,CAAC;gBACpD,IAAI,YAAY,CAAC,IAAI,CAAC,MAAA,aAAa,CAAC,MAAM,CAAC,CAAC,CAAC,0CAAE,WAAW,CAAC,EAAE,CAAC;oBAC5D,MAAM,UAAU,GAAG,aAAa,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,KAAK,CAAC;oBACjD,eAAe,CAAC,IAAI,CAClB,GAAG,IAAI,CAAC,wBAAwB,CAAC,MAAM,EAAE,UAAU,CAAC,CACrD,CAAC;gBACJ,CAAC;YACH,CAAC;YAED,OAAO,eAAe,CAAC;QACzB,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACb,OAAO,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;YAClB,OAAO,EAAE,CAAC;QACZ,CAAC;IACH,CAAC;CACF","sourcesContent":["import type { SmartQueryHeuristic, SmartFacet } from '../../models';\nimport { WIKIDATA_ENTITIES } from './wikidata-entity-map';\n\n// If wikidata describes the top query result as X, recommend facet Y, e.g.:\n// X Y\n// written work mt:texts\n// film mt:movies\n// author mt:texts and creator:<query>\n// filmmaker mt:movies and creator:<query>\n// photographer mt:image and creator:<query>\n// visual artist mt:image and creator:<query>\n// etc.\nexport class WikidataHeuristic implements SmartQueryHeuristic {\n private readonly WIKIDATA_BASE_URL = 'https://www.wikidata.org/w/api.php';\n\n private readonly WIKIDATA_DEFAULT_ARGS =\n '?action=wbsearchentities&format=json&language=en&uselang=en&origin=*&type=item&limit=5';\n\n /**\n * Returns the full URL for a Wikidata search for the given query\n * @param query The query to search for\n */\n private getWikidataURL(query: string): string {\n const urlQuery = encodeURIComponent(query);\n return `${this.WIKIDATA_BASE_URL}${this.WIKIDATA_DEFAULT_ARGS}&search=${urlQuery}`;\n }\n\n /**\n * Replaces query placeholders with an actual query string, within a collection of smart facets\n * @param smartFacets The array of smart facets\n * @param query The query string to replace placeholders with\n * @returns A new array of smart facets with all query placeholders replaced\n */\n private replaceQueryPlaceholders(\n smartFacets: SmartFacet[],\n query: string,\n ): SmartFacet[] {\n return smartFacets.map(\n smartFacet =>\n ({\n // Replace placeholders within the smart facet label\n label: smartFacet.label?.replace('__QUERY', query),\n // Replace placeholders within the facets themselves (buckets & display text)\n facets: smartFacet.facets.map(facet => {\n const replaced = {\n ...facet,\n bucketKey: facet.bucketKey.replace('__QUERY', query),\n };\n\n if (facet.displayText) {\n replaced.displayText = replaced.displayText?.replace(\n '__QUERY',\n query,\n );\n }\n\n return replaced;\n }),\n }) as SmartFacet,\n );\n }\n\n /**\n * @inheritdoc\n */\n async getRecommendedFacets(query: string): Promise<SmartFacet[]> {\n const recommendations: SmartFacet[] = [];\n\n try {\n const wikidataURL = this.getWikidataURL(query);\n const wikidataResponse = await fetch(wikidataURL);\n const searchResults = await wikidataResponse.json();\n\n for (const [keyword, facets] of Object.entries(WIKIDATA_ENTITIES)) {\n const keywordRegex = new RegExp(`\\\\b${keyword}\\\\b`);\n if (keywordRegex.test(searchResults.search[0]?.description)) {\n const entityName = searchResults.search[0].label;\n recommendations.push(\n ...this.replaceQueryPlaceholders(facets, entityName),\n );\n }\n }\n\n return recommendations;\n } catch (err) {\n console.warn(err);\n return [];\n }\n }\n}\n"]}
package/package.json CHANGED
@@ -3,7 +3,7 @@
3
3
  "description": "The Internet Archive Collection Browser.",
4
4
  "license": "AGPL-3.0-only",
5
5
  "author": "Internet Archive",
6
- "version": "2.8.1-alpha-webdev7002.3",
6
+ "version": "2.9.0",
7
7
  "main": "dist/index.js",
8
8
  "module": "dist/index.js",
9
9
  "scripts": {
@@ -1,13 +1,29 @@
1
1
  import type { KeywordFacetMap, SmartFacet } from '../../models';
2
2
 
3
- const TEXTS: SmartFacet = { facets: [{ facetType: 'mediatype', bucketKey: 'texts' }] };
4
- const AUDIO: SmartFacet = { facets: [{ facetType: 'mediatype', bucketKey: 'audio' }] };
5
- const MOVIES: SmartFacet = { facets: [{ facetType: 'mediatype', bucketKey: 'movies' }] };
6
- const IMAGE: SmartFacet = { facets: [{ facetType: 'mediatype', bucketKey: 'image' }] };
7
- const SOFTWARE: SmartFacet = { facets: [{ facetType: 'mediatype', bucketKey: 'software' }] };
8
- const ETREE: SmartFacet = { facets: [{ facetType: 'mediatype', bucketKey: 'etree' }] };
9
- const WEB: SmartFacet = { facets: [{ facetType: 'mediatype', bucketKey: 'web' }] };
10
- const DATA: SmartFacet = { facets: [{ facetType: 'mediatype', bucketKey: 'data' }] };
3
+ const TEXTS: SmartFacet = {
4
+ facets: [{ facetType: 'mediatype', bucketKey: 'texts' }],
5
+ };
6
+ const AUDIO: SmartFacet = {
7
+ facets: [{ facetType: 'mediatype', bucketKey: 'audio' }],
8
+ };
9
+ const MOVIES: SmartFacet = {
10
+ facets: [{ facetType: 'mediatype', bucketKey: 'movies' }],
11
+ };
12
+ const IMAGE: SmartFacet = {
13
+ facets: [{ facetType: 'mediatype', bucketKey: 'image' }],
14
+ };
15
+ const SOFTWARE: SmartFacet = {
16
+ facets: [{ facetType: 'mediatype', bucketKey: 'software' }],
17
+ };
18
+ const ETREE: SmartFacet = {
19
+ facets: [{ facetType: 'mediatype', bucketKey: 'etree' }],
20
+ };
21
+ const WEB: SmartFacet = {
22
+ facets: [{ facetType: 'mediatype', bucketKey: 'web' }],
23
+ };
24
+ const DATA: SmartFacet = {
25
+ facets: [{ facetType: 'mediatype', bucketKey: 'data' }],
26
+ };
11
27
 
12
28
  /**
13
29
  * Map from keywords found in the search query to an array of
@@ -70,21 +70,15 @@ export class WikidataHeuristic implements SmartQueryHeuristic {
70
70
  const wikidataURL = this.getWikidataURL(query);
71
71
  const wikidataResponse = await fetch(wikidataURL);
72
72
  const searchResults = await wikidataResponse.json();
73
- console.log('wikidata results', searchResults);
74
73
 
75
74
  for (const [keyword, facets] of Object.entries(WIKIDATA_ENTITIES)) {
76
- console.log('testing keyword', keyword);
77
75
  const keywordRegex = new RegExp(`\\b${keyword}\\b`);
78
- console.log('regex', keywordRegex);
79
- console.log('description', searchResults.search[0]?.description);
80
- console.log('test', keywordRegex.test(searchResults.search[0]?.description));
81
76
  if (keywordRegex.test(searchResults.search[0]?.description)) {
82
77
  const entityName = searchResults.search[0].label;
83
78
  recommendations.push(
84
79
  ...this.replaceQueryPlaceholders(facets, entityName),
85
80
  );
86
81
  }
87
- console.log('recs', recommendations);
88
82
  }
89
83
 
90
84
  return recommendations;