2019-05-11 18:37:59 +03:00
|
|
|
import path from 'path'
|
|
|
|
|
|
|
|
import Ner from '@/core/ner'
|
|
|
|
|
|
|
|
describe('NER', () => {
|
|
|
|
describe('constructor()', () => {
|
|
|
|
test('creates a new instance of Ner', () => {
  // Constructing with no arguments must yield an object whose prototype
  // chain includes Ner.
  expect(new Ner()).toBeInstanceOf(Ner)
})
|
|
|
|
})
|
|
|
|
|
|
|
|
describe('logExtraction()', () => {
|
|
|
|
test('logs entities extractions', () => {
  // Swap console.log for a fresh mock so its arguments can be inspected.
  // The real implementation is kept and put back in `finally`, so the mock
  // does not leak into the tests that run after this one.
  const originalLog = console.log
  console.log = jest.fn()

  try {
    Ner.logExtraction([
      { sourceText: 'shopping', entity: 'list' },
      { sourceText: 'red', entity: 'color' }
    ])

    // The first two console.log calls are expected to carry the formatted
    // entity as their second argument, in the order the entities were given.
    expect(console.log.mock.calls[0][1]).toBe('{ value: shopping, entity: list }')
    expect(console.log.mock.calls[1][1]).toBe('{ value: red, entity: color }')
  } finally {
    console.log = originalLog
  }
})
|
|
|
|
})
|
|
|
|
|
2021-04-01 12:07:09 +03:00
|
|
|
describe('extractEntities()', () => {
|
2019-05-11 18:37:59 +03:00
|
|
|
test('finds no entity', async () => {
  // Expressions file of the "leon" package, resolved relative to this test file.
  const expressionsFile = path.join(
    __dirname,
    '../../../../packages/leon/data/expressions/en.json'
  )

  // Input handed to extractEntities: an utterance with no pre-filled
  // entities, classified as leon / randomnumber / run.
  const input = {
    utterance: 'Give me a random number',
    entities: [],
    classification: {
      package: 'leon',
      module: 'randomnumber',
      action: 'run',
      confidence: 1
    }
  }

  const found = await new Ner().extractEntities('en', expressionsFile, input)

  // Nothing to extract from this utterance: the result must be an empty array.
  expect(found).toEqual([])
})
|
|
|
|
|
|
|
|
test('extracts built-in entities', async () => {
  const ner = new Ner()

  // Stub the static logger with a fresh mock for this test only. The previous
  // value is restored in `finally` so the stub does not leak into other tests
  // (for instance the one exercising Ner.logExtraction itself).
  const originalLogExtraction = Ner.logExtraction
  Ner.logExtraction = jest.fn()

  try {
    const entities = await ner.extractEntities(
      'en',
      path.join(__dirname, '../../../../packages/trend/data/expressions/en.json'),
      {
        utterance: 'Give me the 2 latest GitHub trends',
        // The input already carries one "number" entity.
        entities: [{ sourceText: 2, entity: 'number' }],
        classification: {
          package: 'trend',
          module: 'github',
          action: 'run',
          confidence: 1
        }
      }
    )

    // The extraction is expected to be logged exactly once and to yield a
    // single entity.
    expect(Ner.logExtraction).toHaveBeenCalledTimes(1)
    expect(entities.length).toBe(1)
  } finally {
    Ner.logExtraction = originalLogExtraction
  }
})
|
|
|
|
|
|
|
|
test('does not support entity type', async () => {
  // The only assertion lives in the catch block. Requiring exactly one
  // assertion makes the test fail, instead of passing vacuously, when
  // extractEntities does not throw at all.
  expect.assertions(1)

  const ner = new Ner()

  try {
    await ner.extractEntities(
      'en',
      global.paths.expressions,
      {
        utterance: 'Just an utterance',
        entities: [],
        classification: {
          package: 'doesnotmatter',
          module: 'unittest',
          action: 'do_not_support_entity',
          confidence: 1
        }
      }
    )
  } catch (e) {
    // The thrown value is expected to expose this error code.
    expect(e.code).toBe('random_ner_type_not_supported')
  }
})
|
|
|
|
|
|
|
|
test('extracts trim custom entities with between conditions', async () => {
  const ner = new Ner()

  // Stub the static logger with a fresh mock for this test only; the previous
  // value is restored in `finally` so the stub does not leak into other tests.
  const originalLogExtraction = Ner.logExtraction
  Ner.logExtraction = jest.fn()

  try {
    const entities = await ner.extractEntities(
      'en',
      path.join(__dirname, '../../../../packages/calendar/data/expressions/en.json'),
      {
        utterance: 'Create a shopping list',
        entities: [],
        classification: {
          package: 'calendar',
          module: 'todolist',
          action: 'create_list',
          confidence: 1
        }
      }
    )

    // Exactly one entity is expected: "shopping", tagged as "list".
    expect(Ner.logExtraction).toHaveBeenCalledTimes(1)
    expect(entities.length).toBe(1)
    expect(entities[0].entity).toBe('list')
    expect(entities[0].sourceText).toBe('shopping')
  } finally {
    Ner.logExtraction = originalLogExtraction
  }
})
|
|
|
|
|
|
|
|
test('extracts trim custom entities with before and after conditions', async () => {
  const ner = new Ner()

  // Stub the static logger with a fresh mock for this test only; the previous
  // value is restored in `finally` so the stub does not leak into other tests.
  const originalLogExtraction = Ner.logExtraction
  Ner.logExtraction = jest.fn()

  try {
    const entities = await ner.extractEntities(
      'en',
      global.paths.expressions,
      {
        utterance: 'Please whistle as a bird',
        entities: [],
        classification: {
          package: 'doesnotmatter',
          module: 'mockingbird',
          action: 'test',
          confidence: 1
        }
      }
    )

    expect(Ner.logExtraction).toHaveBeenCalledTimes(1)

    // Two entities are expected, in this order: the text matched as "start"
    // and the text matched as "animal".
    expect(entities.length).toBe(2)
    expect(entities.map((e) => e.entity)).toEqual(['start', 'animal'])
    expect(entities.map((e) => e.sourceText)).toEqual(['Please whistle as a', 'bird'])
  } finally {
    Ner.logExtraction = originalLogExtraction
  }
})
|
|
|
|
|
|
|
|
test('extracts regex custom entities', async () => {
  const ner = new Ner()

  // Stub the static logger with a fresh mock for this test only; the previous
  // value is restored in `finally` so the stub does not leak into other tests.
  const originalLogExtraction = Ner.logExtraction
  Ner.logExtraction = jest.fn()

  try {
    const entities = await ner.extractEntities(
      'en',
      global.paths.expressions,
      {
        utterance: 'I love the color blue, white and red',
        entities: [],
        classification: {
          package: 'preference',
          module: 'color',
          action: 'run',
          confidence: 1
        }
      }
    )

    expect(Ner.logExtraction).toHaveBeenCalledTimes(1)

    // Every color named in the utterance is expected as its own "color"
    // entity, in the order it appears.
    expect(entities.length).toBe(3)
    expect(entities.map((e) => e.entity)).toEqual(['color', 'color', 'color'])
    expect(entities.map((e) => e.sourceText)).toEqual(['blue', 'white', 'red'])
  } finally {
    Ner.logExtraction = originalLogExtraction
  }
})
|
|
|
|
})
|
|
|
|
})
|