make-mp-data 3.0.3 → 3.0.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +46 -0
- package/dungeons/array-of-object-lookup-schema.json +327 -0
- package/dungeons/array-of-object-lookup.js +29 -9
- package/dungeons/capstone/capstone-ic3.js +291 -0
- package/dungeons/capstone/capstone-ic4.js +598 -0
- package/dungeons/capstone/capstone-ic5.js +668 -0
- package/dungeons/capstone/generate-product-lookup.js +309 -0
- package/dungeons/ecommerce-schema.json +462 -0
- package/dungeons/{copilot.js → ecommerce.js} +79 -17
- package/dungeons/education-schema.json +2409 -0
- package/dungeons/education.js +226 -462
- package/dungeons/fintech-schema.json +14034 -0
- package/dungeons/fintech.js +134 -413
- package/dungeons/foobar-schema.json +403 -0
- package/dungeons/foobar.js +27 -4
- package/dungeons/food-delivery-schema.json +192 -0
- package/dungeons/food-delivery.js +602 -0
- package/dungeons/food-schema.json +1152 -0
- package/dungeons/food.js +173 -406
- package/dungeons/gaming-schema.json +1270 -0
- package/dungeons/gaming.js +182 -42
- package/dungeons/insurance-application-schema.json +204 -0
- package/dungeons/insurance-application.js +605 -0
- package/dungeons/media-schema.json +906 -0
- package/dungeons/media.js +250 -420
- package/dungeons/retention-cadence-schema.json +78 -0
- package/dungeons/retention-cadence.js +35 -1
- package/dungeons/rpg-schema.json +4526 -0
- package/dungeons/rpg.js +171 -429
- package/dungeons/sanity-schema.json +255 -0
- package/dungeons/sanity.js +21 -10
- package/dungeons/sass-schema.json +1291 -0
- package/dungeons/sass.js +241 -368
- package/dungeons/scd-schema.json +919 -0
- package/dungeons/scd.js +41 -13
- package/dungeons/simple-schema.json +608 -0
- package/dungeons/simple.js +52 -15
- package/dungeons/simplest-schema.json +1418 -0
- package/dungeons/simplest.js +392 -0
- package/dungeons/social-schema.json +1118 -0
- package/dungeons/social.js +150 -391
- package/dungeons/text-generation-schema.json +3096 -0
- package/dungeons/text-generation.js +71 -0
- package/index.js +8 -6
- package/lib/core/config-validator.js +28 -8
- package/lib/core/storage.js +5 -5
- package/lib/generators/events.js +4 -4
- package/lib/orchestrators/mixpanel-sender.js +16 -13
- package/lib/orchestrators/user-loop.js +14 -6
- package/lib/templates/soup-presets.js +188 -0
- package/lib/utils/utils.js +52 -6
- package/package.json +1 -1
- package/types.d.ts +20 -3
- package/dungeons/adspend.js +0 -130
- package/dungeons/anon.js +0 -128
- package/dungeons/benchmark-heavy.js +0 -240
- package/dungeons/benchmark-light.js +0 -140
- package/dungeons/big.js +0 -226
- package/dungeons/business.js +0 -391
- package/dungeons/complex.js +0 -428
- package/dungeons/experiments.js +0 -137
- package/dungeons/funnels.js +0 -309
- package/dungeons/mil.js +0 -323
- package/dungeons/mirror.js +0 -161
- package/dungeons/soup-test.js +0 -52
- package/dungeons/streaming.js +0 -372
- package/dungeons/strict-event-test.js +0 -30
- package/dungeons/student-teacher.js +0 -438
- package/dungeons/too-big-events.js +0 -203
- package/dungeons/user-agent.js +0 -209
|
@@ -0,0 +1,291 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* ═══════════════════════════════════════════════════════════════
|
|
3
|
+
* DATASET OVERVIEW
|
|
4
|
+
* ═══════════════════════════════════════════════════════════════
|
|
5
|
+
*
|
|
6
|
+
* IC3 Capstone — e-commerce dataset for Mixpanel certification.
|
|
7
|
+
* - 25,000 users over 180 days, ~5M events
|
|
8
|
+
* - Events: checkout (array-of-object cart), add to cart, view/save items
|
|
9
|
+
* - Nested product arrays with product_id lookups
|
|
10
|
+
* - Location, browser, session tracking enabled
|
|
11
|
+
*
|
|
12
|
+
* ═══════════════════════════════════════════════════════════════
|
|
13
|
+
* ANALYTICS HOOKS (1 pattern)
|
|
14
|
+
* ═══════════════════════════════════════════════════════════════
|
|
15
|
+
*
|
|
16
|
+
* 1. EVENT DUPLICATION (everything hook)
|
|
17
|
+
* Every user gets ~3-7 random events duplicated, simulating
|
|
18
|
+
* real-world duplicate event ingestion that students must
|
|
19
|
+
* identify and handle in their analysis.
|
|
20
|
+
*/
|
|
21
|
+
|
|
22
|
+
import Chance from 'chance';
|
|
23
|
+
let chance = new Chance();
|
|
24
|
+
import dayjs from "dayjs";
|
|
25
|
+
import utc from "dayjs/plugin/utc.js";
|
|
26
|
+
dayjs.extend(utc);
|
|
27
|
+
import { uid, comma } from 'ak-tools';
|
|
28
|
+
import { pickAWinner, weighNumRange, date, integer, weighChoices } from "../brain/utils/utils.js";
|
|
29
|
+
|
|
30
|
+
// Categories attached to video funnel events (see the `props` of the video funnels).
const videoCategories = [
	"funny",
	"educational",
	"inspirational",
	"music",
	"news",
	"sports",
	"cooking",
	"DIY",
	"travel",
	"gaming"
];

// Pool of values for the `spiritAnimal` user property.
// Order is kept exactly as authored so index-based picks stay stable.
const spiritAnimals = [
	"duck", "dog", "otter", "penguin", "cat", "elephant", "lion", "cheetah",
	"giraffe", "zebra", "rhino", "hippo", "whale", "dolphin", "shark", "octopus",
	"squid", "jellyfish", "starfish", "seahorse", "crab", "lobster", "shrimp", "clam",
	"snail", "slug", "butterfly", "moth", "bee", "wasp", "ant", "beetle",
	"ladybug", "caterpillar", "centipede", "millipede", "scorpion", "spider", "tarantula", "tick",
	"mite", "mosquito", "fly", "dragonfly", "damselfly", "grasshopper", "cricket", "locust",
	"mantis", "cockroach", "termite", "praying mantis", "walking stick", "stick bug", "leaf insect", "lacewing",
	"aphid", "cicada", "thrips", "psyllid", "scale insect", "whitefly", "mealybug", "planthopper",
	"leafhopper", "treehopper", "flea", "louse", "bedbug", "flea beetle", "weevil", "longhorn beetle",
	"leaf beetle", "tiger beetle", "ground beetle", "lady beetle", "firefly", "click beetle", "rove beetle", "scarab beetle",
	"dung beetle", "stag beetle", "rhinoceros beetle", "hercules beetle", "goliath beetle", "jewel beetle", "tortoise beetle"
];
|
|
32
|
+
|
|
33
|
+
/**
 * IC3 capstone dungeon definition.
 *
 * Declares the event catalogue (commerce, page view, video and sign-up events),
 * four funnels, super/user properties, one lookup table keyed on `luckyNumber`,
 * and a hook that appends duplicated events during the "everything" pass.
 *
 * @type {import('../types.js').Dungeon}
 */
const config = {
	token: "",
	seed: "IC3 baby!",
	name: "ic3-capstone",
	numDays: 180, // how many days' worth of data
	numEvents: 5_000_000, // how many events
	numUsers: 25_000, // how many users
	format: 'json', // csv or json
	region: "US",
	hasAnonIds: true, // if true, anonymousIds are created for each user
	hasSessionIds: true, // if true, session ids are created for each user
	hasAdSpend: false,
	makeChart: false,
	hasLocation: true,
	hasAndroidDevices: false,
	hasIOSDevices: false,
	hasDesktopDevices: true,
	hasBrowser: true,
	hasCampaigns: false,
	isAnonymous: false,
	alsoInferFunnels: false,
	concurrency: 1,
	batchSize: 250_000,
	writeToDisk: true,
	events: [
		{
			event: "checkout",
			weight: 2,
			properties: {
				currency: pickAWinner(["USD", "CAD", "EUR", "BTC", "ETH", "JPY"], 0),
				coupon: weighChoices(["none", "none", "none", "none", "10%OFF", "20%OFF", "10%OFF", "20%OFF", "30%OFF", "40%OFF", "50%OFF"]),
				// array-of-objects cart, up to makeProducts' default item cap
				cart: makeProducts()
			}
		},
		{
			event: "add to cart",
			weight: 4,
			properties: {
				item: makeProducts(1),
			}
		},
		{
			event: "view item",
			weight: 8,
			properties: {
				item: makeProducts(1)
			}
		},
		{
			event: "save item",
			weight: 5,
			properties: {
				item: makeProducts(1),
			}
		},
		{
			event: "page view",
			weight: 10,
			properties: {
				page: ["/", "/help", "/account", "/watch", "/listen", "/product", "/people", "/peace"],
			}
		},
		{
			event: "watch video",
			weight: 8,
			properties: {
				watchTimeSec: weighNumRange(10, 600, .25),
			}
		},
		{
			event: "like video",
			weight: 6,
			properties: {}
		},
		{
			event: "dislike video",
			weight: 4,
			properties: {}
		},
		{
			event: "sign up",
			weight: 1,
			isFirstEvent: true,
			properties: {
				signupMethod: pickAWinner(["email", "google", "facebook", "twitter", "linkedin", "github"]),
				referral: weighChoices(["none", "none", "none", "friend", "ad", "ad", "ad", "friend", "friend", "friend", "friend"]),
			}
		},
	],
	funnels: [
		{
			sequence: ["page view", "view item", "save item", "page view", "sign up"],
			conversionRate: 50,
			order: "first-and-last-fixed",
			weight: 1,
			isFirstFunnel: true,
			timeToConvert: 2,
			experiment: false,
			name: "Signup Flow"
		},
		{
			sequence: ["watch video", "like video", "watch video", "like video"],
			name: "Video Likes",
			conversionRate: 60,
			props: {
				videoCategory: videoCategories,
				quality: ["2160p", "1440p", "1080p", "720p", "480p", "360p", "240p"],
				format: ["mp4", "avi", "mov", "mpg"],
				uploader_id: chance.guid.bind(chance)
			}
		},
		{
			name: "Video Dislikes",
			sequence: ["watch video", "dislike video", "watch video", "dislike video"],
			conversionRate: 20,
			props: {
				videoCategory: videoCategories,
				quality: ["2160p", "1440p", "1080p", "720p", "480p", "360p", "240p"],
				format: ["mp4", "avi", "mov", "mpg"],
				uploader_id: chance.guid.bind(chance)
			}
		},
		{
			name: "eCommerce Purchase",
			sequence: ["view item", "view item", "add to cart", "view item", "add to cart", "checkout"],
			conversionRate: 15,
			requireRepeats: true,
			weight: 10,
			order: "last-fixed",
		}
	],
	superProps: {
		theme: pickAWinner(["light", "dark", "custom", "light", "dark"]),
	},
	/*
	user properties work the same as event properties
	each key should be an array or function reference
	*/
	userProps: {
		title: chance.profession.bind(chance),
		luckyNumber: weighNumRange(1, 500, .3),
		spiritAnimal: spiritAnimals
	},
	scdProps: {},
	mirrorProps: {},
	/*
	for group analytics keys, we need an array of arrays [[],[],[]]
	each pair represents a group_key and the number of profiles for that key
	*/
	groupKeys: [],
	groupProps: {},
	lookupTables: [{
		// same key name as the `luckyNumber` user property above
		key: "luckyNumber",
		entries: 500,
		attributes: {
			present: ["happy", "sad", "angry", "confused", "excited", "bored", "curious", "anxious", "relaxed", "stressed"],
			past: ["joyful", "melancholy", "furious", "puzzled", "thrilled", "weary", "inquiring", "nervous", "calm", "tense"],
			future: ["hopeful", "dreadful", "optimistic", "skeptical", "eager", "lethargic", "inquiring", "apprehensive", "confident", "uneasy"],
			weather: ["sunny", "rainy", "cloudy", "stormy", "snowy", "windy", "foggy", "humid", "dry", "chilly"],
			temperature: weighNumRange(-10, 100)
		}
	}],
	/**
	 * Post-processing hook: injects duplicate events for the "everything" pass.
	 *
	 * For `type === "everything"`, 3-7 distinct positions of `record` are chosen
	 * at random and a shallow copy of each chosen element is appended to `record`
	 * in place. When `record` has fewer elements than the drawn count, the count
	 * falls back to `record.length - 1`. Every other `type` is returned untouched.
	 *
	 * @param {any} record - value being processed; treated as an array when
	 *   `type` is "everything" (presumably one user's events — confirm against the caller)
	 * @param {string} type - which kind of record is being processed
	 * @param {any} meta - unused here; kept for signature compatibility
	 * @returns {any} the same `record` reference that was passed in
	 */
	hook: function (record, type, meta) {
		// This hook runs for every record type, so bail out before doing any work.
		if (type !== "everything") return record;

		// every user gets ~3-7 duplicate events
		let numDupes = integer(3, 7);
		if (record.length < numDupes) numDupes = record.length - 1;

		// pick distinct random positions to duplicate; a Set drops repeats
		// and iterates in insertion order
		const dupeIndexes = new Set();
		while (dupeIndexes.size < numDupes) {
			dupeIndexes.add(integer(0, record.length - 1));
		}

		// append a shallow copy of each chosen event (nested values are shared)
		for (const idx of dupeIndexes) {
			record.push({ ...record[idx] });
		}

		return record;
	}
};
|
|
242
|
+
|
|
243
|
+
/**
 * Create a property generator that yields a random list of product objects.
 *
 * Each call to the returned generator draws an item count via `integer(1, maxItems)`
 * and builds that many items with `amount`, `quantity`, `total_value`,
 * `featured`, `category`, `descriptor`, `slug`, `assetPreview` and `assetType`.
 *
 * @param {number} [maxItems=5] - upper bound passed to `integer` for the item count
 * @returns {() => (() => Array<Array<Object>>)} a generator whose result is a
 *   thunk returning the item list wrapped in a single-element outer array
 */
function makeProducts(maxItems = 5) {
	// The word lists never change, so build them once per generator
	// instead of once per generated event.
	const categories = ["electronics", "books", "clothing", "home", "garden", "toys", "sports", "automotive", "beauty", "health", "grocery", "jewelry", "shoes", "tools", "office supplies"];
	const descriptors = ["brand new", "open box", "refurbished", "used", "like new", "vintage", "antique", "collectible"];
	const suffix = ["item", "product", "good", "merchandise", "thing", "object", "widget", "gadget", "device", "apparatus", "contraption", "instrument", "tool", "implement", "utensil", "appliance", "machine", "equipment", "gear", "kit", "set", "package"];
	const assetPreview = ['.png', '.jpg', '.jpeg', '.heic', '.mp4', '.mov', '.avi'];

	return function () {
		const data = [];
		const numOfItems = integer(1, maxItems);

		for (let i = 0; i < numOfItems; i++) {
			// NOTE: the order of the random draws below is kept stable on purpose.
			const category = chance.pickone(categories);
			const descriptor = chance.pickone(descriptors);
			const suffixWord = chance.pickone(suffix);
			const slug = `${descriptor.replace(/\s+/g, '-').toLowerCase()}-${suffixWord.replace(/\s+/g, '-').toLowerCase()}`;
			const asset = chance.pickone(assetPreview);

			const price = integer(1, 100);
			const quantity = integer(1, 5);

			// NOTE(review): `product_id` and `sku` were commented out in the original,
			// so items carry no identifier — confirm whether a lookup join is expected.
			data.push({
				amount: price,
				quantity: quantity,
				total_value: price * quantity,
				featured: chance.pickone([true, false, false]),
				category: category,
				descriptor: descriptor,
				slug: slug,
				assetPreview: `https://example.com/assets/${slug}${asset}`,
				assetType: asset
			});
		}

		// Wrapped as [[...items]] behind a thunk; presumably so a resolver that
		// picks one element from an array returns the whole list — confirm in utils.
		return () => [data];
	};
}
|
|
284
|
+
|
|
285
|
+
|
|
286
|
+
/**
 * Weighted coin flip backed by the module-level `chance` instance.
 *
 * @param {number} [likelihood=50] - forwarded as the `likelihood` option of `chance.bool`
 * @returns {boolean} the result of `chance.bool`
 */
function flip(likelihood = 50) {
	const options = { likelihood: likelihood };
	const outcome = chance.bool(options);
	return outcome;
}
|
|
289
|
+
|
|
290
|
+
|
|
291
|
+
export default config;
|