Skip to content

Commit

Permalink
support both dcat us 1.1 and 3.0
Browse files Browse the repository at this point in the history
  • Loading branch information
sansth1010 committed Nov 21, 2024
1 parent 4aef6c3 commit 072a4ae
Show file tree
Hide file tree
Showing 7 changed files with 272 additions and 43 deletions.
85 changes: 79 additions & 6 deletions src/dcat-us/compile-dcat-feed.test.ts
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,82 @@ import { compileDcatFeedEntry } from './compile-dcat-feed';
import * as datasetFromApi from '../test-helpers/mock-dataset.json';
import { DcatUsError } from './dcat-us-error';

describe('generating DCAT-US 1.0 feed', () => {
const version = '1.1';
it('should throw 400 DcatUs error if template contains transformer that is not defined', async function () {
const dcatTemplate = {
title: '{{name}}',
description: '{{description}}',
keyword: '{{tags}}',
issued: '{{created:toISO}}'
}

try {
compileDcatFeedEntry(datasetFromApi, dcatTemplate, {}, version);
} catch (error) {
expect(error).toBeInstanceOf(DcatUsError);
expect(error).toHaveProperty('statusCode', 400);
}
});

it('show return distribution in a single array', async function () {
const dcatTemplate = {
title: '{{name}}',
description: '{{description}}',
keyword: '{{tags}}',
distribution: [
'distro1',
'distro2',
['distro3', 'distro4']
]
}

const dcatDataset = JSON.parse(compileDcatFeedEntry(datasetFromApi, dcatTemplate, {}, version));
expect(dcatDataset.distribution).toBeDefined();
expect(dcatDataset.distribution).toStrictEqual(['distro1', 'distro2', 'distro3', 'distro4']);
});

it('show not return uninterpolated distribution in dataset', async function () {
const dcatTemplate = {
title: '{{name}}',
description: '{{description}}',
keyword: '{{tags}}',
distribution: ['distro1', '{{distroname}}']
}
const dcatDataset = JSON.parse(compileDcatFeedEntry(datasetFromApi, dcatTemplate, {}, version));
expect(dcatDataset.distribution).toStrictEqual(['distro1']);
});

it('should contain default theme if spatial key exists in dataset', async function () {
const distribution = ['distro1', '{{distroname}}'];
const dcatTemplate = {
title: '{{name}}',
description: '{{description}}',
keyword: '{{tags}}',
distribution,
spatial: '{{extent}}'
}
const dcatDataset = JSON.parse(compileDcatFeedEntry(datasetFromApi, dcatTemplate, {}, version));
expect(dcatDataset.theme).toBeDefined();
expect(dcatDataset.theme).toStrictEqual(['geospatial']);
});

it('should throw error if geojson from provider is missing', async function () {
const dcatTemplate = {
title: '{{name}}',
description: '{{description}}',
keyword: '{{tags}}',
issued: '{{created:toISO}}'
};

expect(() => {
compileDcatFeedEntry(undefined, dcatTemplate, {}, version);
}).toThrow(DcatUsError);
});
});

describe('generating DCAT-US 3.0 feed', () => {
const version = '3.0';
it('should throw 400 DcatUs error if template contains transformer that is not defined', async function () {
const dcatTemplate = {
title: '{{name}}',
Expand All @@ -12,7 +87,7 @@ describe('generating DCAT-US 3.0 feed', () => {
}

try {
compileDcatFeedEntry(datasetFromApi, dcatTemplate, {});
compileDcatFeedEntry(datasetFromApi, dcatTemplate, {}, version);
} catch (error) {
expect(error).toBeInstanceOf(DcatUsError);
expect(error).toHaveProperty('statusCode', 400);
Expand All @@ -31,7 +106,7 @@ describe('generating DCAT-US 3.0 feed', () => {
]
}

const dcatDataset = JSON.parse(compileDcatFeedEntry(datasetFromApi, dcatTemplate, {}));
const dcatDataset = JSON.parse(compileDcatFeedEntry(datasetFromApi, dcatTemplate, {}, version));
expect(dcatDataset['dcat:distribution']).toBeDefined();
expect(dcatDataset['dcat:distribution']).toStrictEqual(['distro1', 'distro2', 'distro3', 'distro4']);
});
Expand All @@ -43,7 +118,7 @@ describe('generating DCAT-US 3.0 feed', () => {
keyword: '{{tags}}',
'dcat:distribution': ['distro1', '{{distroname}}']
}
const dcatDataset = JSON.parse(compileDcatFeedEntry(datasetFromApi, dcatTemplate, {}));
const dcatDataset = JSON.parse(compileDcatFeedEntry(datasetFromApi, dcatTemplate, {}, version));
expect(dcatDataset['dcat:distribution']).toStrictEqual(['distro1']);
});

Expand All @@ -56,9 +131,7 @@ describe('generating DCAT-US 3.0 feed', () => {
};

expect(() => {
compileDcatFeedEntry(undefined, dcatTemplate, {});
compileDcatFeedEntry(undefined, dcatTemplate, {}, version);
}).toThrow(DcatUsError);

});

});
32 changes: 25 additions & 7 deletions src/dcat-us/compile-dcat-feed.ts
Original file line number Diff line number Diff line change
Expand Up @@ -9,15 +9,33 @@ type Feature = {
properties: Record<string, any>
};

export function compileDcatFeedEntry(geojsonFeature: Feature | undefined, feedTemplate: DcatDatasetTemplate, feedTemplateTransforms: TransformsList): string {
export function compileDcatFeedEntry(
geojsonFeature: Feature | undefined,
feedTemplate: DcatDatasetTemplate,
feedTemplateTransforms: TransformsList,
version: string
): string {
try {
const dcatFeedItem = generateDcatItem(feedTemplate, feedTemplateTransforms, geojsonFeature);
return indent(JSON.stringify({
...dcatFeedItem,
'dcat:distribution':
Array.isArray(dcatFeedItem['dcat:distribution']) &&
removeUninterpolatedDistributions(_.flatten(dcatFeedItem['dcat:distribution'])),
}, null, '\t'), 2);
let feedEntry: Record<string, any>;
if (version === '1.1') {
feedEntry = {
...dcatFeedItem,
distribution: Array.isArray(dcatFeedItem.distribution) && removeUninterpolatedDistributions(_.flatten(dcatFeedItem.distribution)),
theme: dcatFeedItem.spatial && ['geospatial']
};
}

if (version === '3.0') {
feedEntry = {
...dcatFeedItem,
'dcat:distribution':
Array.isArray(dcatFeedItem['dcat:distribution']) &&
removeUninterpolatedDistributions(_.flatten(dcatFeedItem['dcat:distribution'])),
};
}

return indent(JSON.stringify(feedEntry, null, '\t'), 2);
} catch (err) {
throw new DcatUsError(err.message, 400);
}
Expand Down
13 changes: 12 additions & 1 deletion src/dcat-us/constants/contexts.ts
Original file line number Diff line number Diff line change
@@ -1,4 +1,15 @@
export const HEADER_V3 = {
// Context header for DCAT US 1.1
export const HEADER_V_1_1 = {
'@context':
'https://project-open-data.cio.gov/v1.1/schema/catalog.jsonld',
'@type': 'dcat:Catalog',
conformsTo: 'https://project-open-data.cio.gov/v1.1/schema',
describedBy: 'https://project-open-data.cio.gov/v1.1/schema/catalog.json',
};

// Context header for DCAT US 3.0
// source: https://raw.githubusercontent.com/DOI-DO/dcat-us/refs/heads/main/context/dcat-us-3.0.jsonld
export const HEADER_V_3 = {
'@context': {
'@version': 1.1,
'@protected': true,
Expand Down
79 changes: 67 additions & 12 deletions src/dcat-us/index.test.ts
Original file line number Diff line number Diff line change
@@ -1,21 +1,74 @@
import { readableFromArray, streamToString } from '../test-helpers/stream-utils';
import { getDataStreamDcatUs11 } from './';
import { getDataStreamDcatUs } from './';
import * as datasetFromApi from '../test-helpers/mock-dataset.json';
import { HEADER_V3 } from './constants/contexts';
import { HEADER_V_3 } from './constants/contexts';

async function generateDcatFeed(dataset, template, templateTransforms) {
const { stream: dcatStream } = getDataStreamDcatUs11(template, templateTransforms);
async function generateDcatFeed(dataset, template, templateTransforms, version) {
const { stream: dcatStream } = getDataStreamDcatUs(template, templateTransforms, version);

const docStream = readableFromArray([dataset]); // no datasets since we're just checking the catalog
const feedString = await streamToString(docStream.pipe(dcatStream));
return { feed: JSON.parse(feedString) };
}

describe('generating DCAT-US 1.1 feed', () => {
const version = '1.1';
it('formats catalog correctly', async function () {
const { feed } = await generateDcatFeed([], {}, {}, version);

expect(feed['@context']).toBe('https://project-open-data.cio.gov/v1.1/schema/catalog.jsonld');
expect(feed['@type']).toBe('dcat:Catalog');
expect(feed['conformsTo']).toBe('https://project-open-data.cio.gov/v1.1/schema');
expect(feed['describedBy']).toBe('https://project-open-data.cio.gov/v1.1/schema/catalog.json');
expect(Array.isArray(feed['dataset'])).toBeTruthy();
});

it('should interprolate dataset stream to feed based upon template', async function () {
const { feed } = await generateDcatFeed(datasetFromApi, {
title: '{{name}}',
description: '{{description}}',
keyword: '{{tags}}',
issued: '{{created:toISO}}',
modified: '{{modified:toISO}}',
publisher: {
name: '{{source}}'
},
contactPoint: {
'@type': 'vcard:Contact',
fn: '{{owner}}',
hasEmail: '{{orgContactEmail:optional}}'
}
},
{
toISO: (_key, val) => {
return new Date(val).toISOString();
}
},
version);

expect(feed['@context']).toBe('https://project-open-data.cio.gov/v1.1/schema/catalog.jsonld');
expect(feed['@type']).toBe('dcat:Catalog');
expect(feed['conformsTo']).toBe('https://project-open-data.cio.gov/v1.1/schema');
expect(feed['describedBy']).toBe('https://project-open-data.cio.gov/v1.1/schema/catalog.json');
expect(Array.isArray(feed['dataset'])).toBeTruthy();
expect(feed['dataset'].length).toBe(1);
const feedResponse = feed['dataset'][0];
expect(feedResponse.title).toBe('Tahoe places of interest');
expect(feedResponse.description).toBe('Description. Here be Tahoe things. You can do a lot here. Here are some more words. And a few more.<div><br /></div><div>with more words</div><div><br /></div><div>adding a few more to test how long it takes for our jobs to execute.</div><div><br /></div><div>Tom was here!</div>');
expect(feedResponse.issued).toBe('2021-01-29T15:34:38.000Z');
expect(feedResponse.modified).toBe('2021-07-27T20:25:19.723Z');
expect(feedResponse.contactPoint).toStrictEqual({ '@type': 'vcard:Contact', fn: 'thervey_qa_pre_a_hub' });
expect(feedResponse.publisher).toStrictEqual({ name: 'QA Premium Alpha Hub' });
expect(feedResponse.keyword).toStrictEqual(['Data collection', 'just modified']);
});
});

describe('generating DCAT-US 3.0 feed', () => {
const version = '3.0';
it('formats catalog correctly', async function () {
const { feed } = await generateDcatFeed([], {}, {});
const { feed } = await generateDcatFeed([], {}, {}, version);

expect(feed['@context']).toStrictEqual(HEADER_V3['@context']);
expect(feed['@context']).toStrictEqual(HEADER_V_3['@context']);
expect(feed['conformsTo']).toBe('https://resource.data.gov/profile/dcat-us#');
expect(feed['@type']).toBe('dcat:Catalog');
expect(Array.isArray(feed['dcat:dataset'])).toBeTruthy();
Expand All @@ -39,13 +92,15 @@ describe('generating DCAT-US 3.0 feed', () => {
header: {
'@id': 'hub.arcgis.com'
}
}, {
toISO: (_key, val) => {
return new Date(val).toISOString();
}
});
},
{
toISO: (_key, val) => {
return new Date(val).toISOString();
}
},
version);

expect(feed['@context']).toStrictEqual(HEADER_V3['@context']);
expect(feed['@context']).toStrictEqual(HEADER_V_3['@context']);
expect(feed['@type']).toBe('dcat:Catalog');
expect(feed['@id']).toBe('hub.arcgis.com');
expect(feed['conformsTo']).toBe('https://resource.data.gov/profile/dcat-us#');
Expand Down
26 changes: 20 additions & 6 deletions src/dcat-us/index.ts
Original file line number Diff line number Diff line change
@@ -1,17 +1,31 @@
import { compileDcatFeedEntry } from './compile-dcat-feed';
import { FeedFormatterStream } from './feed-formatter-stream';
import { TransformsList } from 'adlib';
import { HEADER_V3 } from './constants/contexts';
import { HEADER_V_3, HEADER_V_1_1 } from './constants/contexts';

export function getDataStreamDcatUs11(feedTemplate: any, feedTemplateTransforms: TransformsList) {
export function getDataStreamDcatUs(feedTemplate: any, feedTemplateTransforms: TransformsList, version: string) {
const footer = '\n\t]\n}';
const { header: templateHeader, ...restFeedTemplate } = feedTemplate;
let header: string;
let template: Record<string, any>;

if (version === '3.0') {
const { header: templateHeader, ...restFeedTemplate } = feedTemplate;
template = restFeedTemplate;
const catalogStr = JSON.stringify({ ...HEADER_V_3, ...templateHeader }, null, '\t');
header = `${catalogStr.substring(0, catalogStr.length - 2)},\n\t"dcat:dataset": [\n`;
}

const catalogStr = JSON.stringify({ ...HEADER_V3, ...templateHeader }, null, '\t');
const header = `${catalogStr.substring(0, catalogStr.length - 2)},\n\t"dcat:dataset": [\n`;
if (version === '1.1') {
const catalogStr = JSON.stringify(HEADER_V_1_1, null, '\t');
header = `${catalogStr.substring(
0,
catalogStr.length - 2,
)},\n\t"dataset": [\n`;
template = feedTemplate;
}

const formatFn = (chunk) => {
return compileDcatFeedEntry(chunk, restFeedTemplate, feedTemplateTransforms);
return compileDcatFeedEntry(chunk, template, feedTemplateTransforms, version);
};

return {
Expand Down
Loading

0 comments on commit 072a4ae

Please sign in to comment.