feat: add lead qualification workflow
This commit is contained in:
@@ -4,10 +4,14 @@ import test from "node:test";
|
||||
import {
|
||||
GOOGLE_PLACES_FIELD_MASK,
|
||||
buildGeocodingUrl,
|
||||
getUsableContactEmail,
|
||||
getUsableContactEmailFromEntries,
|
||||
getBlacklistMatches,
|
||||
getBlacklistLookupValues,
|
||||
getPlacesSearchSpec,
|
||||
isProbableDuplicateCandidate,
|
||||
isDuplicateCandidate,
|
||||
normalizeEmailAddress,
|
||||
normalizePlacesResponse,
|
||||
parseGeocodingResponse,
|
||||
} from "../lib/lead-discovery-google";
|
||||
@@ -205,8 +209,12 @@ test("places normalization maps source metadata and normalizes website domain",
|
||||
|
||||
test("duplicate detection uses placeId and websiteDomain", () => {
|
||||
const existingLeads = [
|
||||
{ googlePlaceId: "dup-1", websiteDomain: "other.de" },
|
||||
{ googlePlaceId: "other-2", websiteDomain: "example.de" },
|
||||
{
|
||||
googlePlaceId: "dup-1",
|
||||
websiteDomain: "other.de",
|
||||
email: "blocked@example.de",
|
||||
},
|
||||
{ googlePlaceId: "other-2", websiteDomain: "example.de", email: "blocked@example.de" },
|
||||
];
|
||||
|
||||
assert.equal(
|
||||
@@ -277,6 +285,158 @@ test("duplicate detection uses placeId and websiteDomain", () => {
|
||||
),
|
||||
false,
|
||||
);
|
||||
|
||||
assert.equal(
|
||||
isDuplicateCandidate(
|
||||
{
|
||||
placeId: "none",
|
||||
businessName: "Test",
|
||||
address: "A",
|
||||
websiteUrl: "https://www.example.de",
|
||||
websiteDomain: "new.de",
|
||||
phone: null,
|
||||
rating: null,
|
||||
userRatingCount: null,
|
||||
businessStatus: null,
|
||||
googleTypes: [],
|
||||
googlePrimaryType: null,
|
||||
googleMapsUrl: null,
|
||||
sourceProvider: "google_places",
|
||||
sourceFetchedAt: 0,
|
||||
contactEmails: [{ email: "Owner@Example.De", isBusinessContactAddress: false }],
|
||||
},
|
||||
existingLeads,
|
||||
),
|
||||
false,
|
||||
);
|
||||
|
||||
assert.equal(
|
||||
isDuplicateCandidate(
|
||||
{
|
||||
placeId: "none",
|
||||
businessName: "Test",
|
||||
address: "A",
|
||||
websiteUrl: "https://www.new.de",
|
||||
websiteDomain: "new.de",
|
||||
phone: null,
|
||||
rating: null,
|
||||
userRatingCount: null,
|
||||
businessStatus: null,
|
||||
googleTypes: [],
|
||||
googlePrimaryType: null,
|
||||
googleMapsUrl: null,
|
||||
sourceProvider: "google_places",
|
||||
sourceFetchedAt: 0,
|
||||
contactEmails: [{ email: "newlead@new.de" }],
|
||||
},
|
||||
existingLeads,
|
||||
),
|
||||
false,
|
||||
);
|
||||
|
||||
assert.equal(
|
||||
isDuplicateCandidate(
|
||||
{
|
||||
placeId: "none",
|
||||
businessName: "Test",
|
||||
address: "A",
|
||||
websiteUrl: "https://www.example.de",
|
||||
websiteDomain: "new.de",
|
||||
phone: null,
|
||||
rating: null,
|
||||
userRatingCount: null,
|
||||
businessStatus: null,
|
||||
googleTypes: [],
|
||||
googlePrimaryType: null,
|
||||
googleMapsUrl: null,
|
||||
sourceProvider: "google_places",
|
||||
sourceFetchedAt: 0,
|
||||
email: "Blocked@Example.De",
|
||||
},
|
||||
existingLeads,
|
||||
),
|
||||
true,
|
||||
);
|
||||
});
|
||||
|
||||
test("probable duplicates are detected by normalized company+address or normalized phone", () => {
|
||||
const existingLeads = [
|
||||
{
|
||||
googlePlaceId: "dup-1",
|
||||
companyName: "Muster GmbH",
|
||||
address: "Hauptstraße 1, 60311 Frankfurt am Main",
|
||||
phone: "+49 30 123456",
|
||||
},
|
||||
];
|
||||
|
||||
assert.equal(
|
||||
isProbableDuplicateCandidate(
|
||||
{
|
||||
placeId: "none-1",
|
||||
businessName: "Muster GmbH",
|
||||
address: "Hauptstraße 1, 60311 Frankfurt am Main",
|
||||
websiteUrl: null,
|
||||
websiteDomain: null,
|
||||
phone: null,
|
||||
rating: null,
|
||||
userRatingCount: null,
|
||||
businessStatus: null,
|
||||
googleTypes: [],
|
||||
googlePrimaryType: null,
|
||||
googleMapsUrl: null,
|
||||
sourceProvider: "google_places",
|
||||
sourceFetchedAt: 0,
|
||||
},
|
||||
existingLeads,
|
||||
),
|
||||
true,
|
||||
);
|
||||
|
||||
assert.equal(
|
||||
isProbableDuplicateCandidate(
|
||||
{
|
||||
placeId: "none-2",
|
||||
businessName: "Other GmbH",
|
||||
address: "Nebenstraße 9",
|
||||
websiteUrl: null,
|
||||
websiteDomain: null,
|
||||
phone: "0049 30 123456",
|
||||
rating: null,
|
||||
userRatingCount: null,
|
||||
businessStatus: null,
|
||||
googleTypes: [],
|
||||
googlePrimaryType: null,
|
||||
googleMapsUrl: null,
|
||||
sourceProvider: "google_places",
|
||||
sourceFetchedAt: 0,
|
||||
},
|
||||
existingLeads,
|
||||
),
|
||||
true,
|
||||
);
|
||||
|
||||
assert.equal(
|
||||
isProbableDuplicateCandidate(
|
||||
{
|
||||
placeId: "none-3",
|
||||
businessName: "Different GmbH",
|
||||
address: "Musterallee 5",
|
||||
websiteUrl: null,
|
||||
websiteDomain: null,
|
||||
phone: "+49 89 999999",
|
||||
rating: null,
|
||||
userRatingCount: null,
|
||||
businessStatus: null,
|
||||
googleTypes: [],
|
||||
googlePrimaryType: null,
|
||||
googleMapsUrl: null,
|
||||
sourceProvider: "google_places",
|
||||
sourceFetchedAt: 0,
|
||||
},
|
||||
existingLeads,
|
||||
),
|
||||
false,
|
||||
);
|
||||
});
|
||||
|
||||
test("blacklist matches include google_place_id, domain, company and phone", () => {
|
||||
@@ -287,6 +447,8 @@ test("blacklist matches include google_place_id, domain, company and phone", ()
|
||||
websiteUrl: "https://www.Blocked.de",
|
||||
websiteDomain: "blocked.de",
|
||||
phone: "+49 30 555 123",
|
||||
email: "Info@Blocked.De",
|
||||
contactEmails: [{ email: "Hello@blocked.de", isBusinessContactAddress: false }],
|
||||
rating: null,
|
||||
userRatingCount: null,
|
||||
businessStatus: null,
|
||||
@@ -303,6 +465,8 @@ test("blacklist matches include google_place_id, domain, company and phone", ()
|
||||
{ type: "company", normalizedValue: "muster gmbh" },
|
||||
{ type: "phone", normalizedValue: "4930555123" },
|
||||
{ type: "phone", normalizedValue: "+49 30 555 123" },
|
||||
{ type: "email", normalizedValue: "info@blocked.de" },
|
||||
{ type: "email", normalizedValue: "hello@blocked.de" },
|
||||
]);
|
||||
|
||||
const matches = getBlacklistMatches(
|
||||
@@ -323,12 +487,213 @@ test("blacklist matches include google_place_id, domain, company and phone", ()
|
||||
},
|
||||
{ type: "email", value: "x@example.de", normalizedValue: "x@example.de" },
|
||||
{ type: "phone", value: "+49 30 999 999", normalizedValue: "4930999999" },
|
||||
{
|
||||
type: "email",
|
||||
value: "Info@Blocked.De",
|
||||
normalizedValue: "info@blocked.de",
|
||||
},
|
||||
],
|
||||
);
|
||||
|
||||
const matchTypes = matches.map((match) => match.type).sort();
|
||||
assert.deepEqual(
|
||||
matchTypes,
|
||||
["company", "domain", "google_place_id", "phone", "phone"].sort(),
|
||||
["company", "domain", "google_place_id", "phone", "phone", "email"].sort(),
|
||||
);
|
||||
});
|
||||
|
||||
test("company normalization for blacklist lookup uses text normalization", () => {
|
||||
const candidate = {
|
||||
placeId: "place-company-spaces",
|
||||
businessName: "Muster GmbH",
|
||||
address: "A",
|
||||
websiteUrl: null,
|
||||
websiteDomain: null,
|
||||
phone: "+49 30 555 123",
|
||||
rating: null,
|
||||
userRatingCount: null,
|
||||
businessStatus: null,
|
||||
googleTypes: [],
|
||||
googlePrimaryType: null,
|
||||
googleMapsUrl: null,
|
||||
sourceProvider: "google_places" as const,
|
||||
sourceFetchedAt: 0,
|
||||
};
|
||||
|
||||
assert.deepEqual(getBlacklistLookupValues(candidate), [
|
||||
{ type: "google_place_id", normalizedValue: "place-company-spaces" },
|
||||
{ type: "company", normalizedValue: "muster gmbh" },
|
||||
{ type: "phone", normalizedValue: "4930555123" },
|
||||
{ type: "phone", normalizedValue: "+49 30 555 123" },
|
||||
]);
|
||||
});
|
||||
|
||||
test("company blacklist matching supports whitespace-normalized names", () => {
|
||||
const candidate = {
|
||||
placeId: "place-company-spaces-2",
|
||||
businessName: "Muster GmbH",
|
||||
address: "A",
|
||||
websiteUrl: null,
|
||||
websiteDomain: null,
|
||||
phone: null,
|
||||
rating: null,
|
||||
userRatingCount: null,
|
||||
businessStatus: null,
|
||||
googleTypes: [],
|
||||
googlePrimaryType: null,
|
||||
googleMapsUrl: null,
|
||||
sourceProvider: "google_places" as const,
|
||||
sourceFetchedAt: 0,
|
||||
};
|
||||
|
||||
const matches = getBlacklistMatches(candidate, [
|
||||
{ type: "company", value: "Muster GmbH", normalizedValue: "muster gmbh" },
|
||||
]);
|
||||
|
||||
assert.equal(matches.length, 1);
|
||||
assert.equal(matches[0]!.normalizedValue, "muster gmbh");
|
||||
});
|
||||
|
||||
test("email normalization strips whitespace, lowercases, and rejects malformed addresses", () => {
|
||||
assert.equal(normalizeEmailAddress(" INFO@Example.DE "), "info@example.de");
|
||||
assert.equal(normalizeEmailAddress("hello@domain"), null);
|
||||
assert.equal(normalizeEmailAddress("no-at-symbol"), null);
|
||||
assert.equal(normalizeEmailAddress("@missing-local.com"), null);
|
||||
assert.equal(normalizeEmailAddress("name@"), null);
|
||||
assert.equal(normalizeEmailAddress(""), null);
|
||||
assert.equal(normalizeEmailAddress("näm@beispiel.de"), null);
|
||||
});
|
||||
|
||||
test("usable email helper prefers generic business aliases and requires explicit metadata for named contacts", () => {
|
||||
const genericPreferred = getUsableContactEmail({
|
||||
placeId: "place-1",
|
||||
businessName: "Bäckerei",
|
||||
address: "Musterweg 1",
|
||||
websiteUrl: null,
|
||||
websiteDomain: null,
|
||||
phone: null,
|
||||
rating: null,
|
||||
userRatingCount: null,
|
||||
businessStatus: null,
|
||||
googleTypes: [],
|
||||
googlePrimaryType: null,
|
||||
googleMapsUrl: null,
|
||||
sourceProvider: "google_places",
|
||||
sourceFetchedAt: 0,
|
||||
contactEmails: [
|
||||
{
|
||||
email: "müller@bäckerei.de",
|
||||
isBusinessContactAddress: false,
|
||||
},
|
||||
{
|
||||
email: "Hello@Bäckerei.De",
|
||||
isBusinessContactAddress: false,
|
||||
},
|
||||
{
|
||||
email: "owner@Bäckerei.De",
|
||||
isBusinessContactAddress: true,
|
||||
},
|
||||
],
|
||||
});
|
||||
|
||||
assert.deepEqual(genericPreferred, {
|
||||
email: "hello@bäckerei.de",
|
||||
emailSource: null,
|
||||
contactPerson: null,
|
||||
});
|
||||
|
||||
const namedWithoutMetadata = getUsableContactEmail({
|
||||
placeId: "place-2",
|
||||
businessName: "Bäckerei",
|
||||
address: "Musterweg 2",
|
||||
websiteUrl: null,
|
||||
websiteDomain: null,
|
||||
phone: null,
|
||||
rating: null,
|
||||
userRatingCount: null,
|
||||
businessStatus: null,
|
||||
googleTypes: [],
|
||||
googlePrimaryType: null,
|
||||
googleMapsUrl: null,
|
||||
sourceProvider: "google_places",
|
||||
sourceFetchedAt: 0,
|
||||
contactEmails: [
|
||||
{
|
||||
email: "owner@Bäckerei.De",
|
||||
isBusinessContactAddress: false,
|
||||
},
|
||||
],
|
||||
});
|
||||
|
||||
assert.equal(namedWithoutMetadata, null);
|
||||
|
||||
const namedWithMetadata = getUsableContactEmail({
|
||||
placeId: "place-3",
|
||||
businessName: "Bäckerei",
|
||||
address: "Musterweg 3",
|
||||
websiteUrl: null,
|
||||
websiteDomain: null,
|
||||
phone: null,
|
||||
rating: null,
|
||||
userRatingCount: null,
|
||||
businessStatus: null,
|
||||
googleTypes: [],
|
||||
googlePrimaryType: null,
|
||||
googleMapsUrl: null,
|
||||
sourceProvider: "google_places",
|
||||
sourceFetchedAt: 0,
|
||||
contactEmails: [
|
||||
{
|
||||
email: "owner@Bäckerei.De",
|
||||
isBusinessContactAddress: true,
|
||||
},
|
||||
],
|
||||
});
|
||||
|
||||
assert.deepEqual(namedWithMetadata, {
|
||||
email: "owner@bäckerei.de",
|
||||
emailSource: null,
|
||||
contactPerson: null,
|
||||
});
|
||||
});
|
||||
|
||||
test("standalone contact-email rule helper rejects invalid entries and prefers generic aliases", () => {
|
||||
const validGeneric = getUsableContactEmailFromEntries([
|
||||
{
|
||||
email: "owner@firma.de",
|
||||
isBusinessContactAddress: false,
|
||||
},
|
||||
{
|
||||
email: "support@firma.de",
|
||||
isBusinessContactAddress: false,
|
||||
},
|
||||
{
|
||||
email: "hello@firma.de",
|
||||
isBusinessContactAddress: false,
|
||||
},
|
||||
]);
|
||||
|
||||
assert.deepEqual(validGeneric, {
|
||||
email: "hello@firma.de",
|
||||
emailSource: null,
|
||||
contactPerson: null,
|
||||
});
|
||||
|
||||
const rejectedNamed = getUsableContactEmailFromEntries([
|
||||
{
|
||||
email: "owner@firma.de",
|
||||
isBusinessContactAddress: false,
|
||||
},
|
||||
]);
|
||||
|
||||
assert.equal(rejectedNamed, null);
|
||||
|
||||
const invalid = getUsableContactEmailFromEntries([
|
||||
{
|
||||
email: "no-at-symbol",
|
||||
isBusinessContactAddress: true,
|
||||
},
|
||||
]);
|
||||
|
||||
assert.equal(invalid, null);
|
||||
});
|
||||
|
||||
Reference in New Issue
Block a user