# ================================================================ begin { if (isabsent(@olen)) { @olen = 16; } if (isabsent(@ocount)) { @ocount = 16; } } # ================================================================ for (_, v in $*) { if (string(v) == "inf" || string(v) == "nan") { continue; } int n = strlen(v); if (n >= 2) { str a = substr(v, 0, 0); str b = substr(v, 1, 1); @a_histo[a] += 1; @ab_histo[a][b] += 1; for (int i = 0; i < n-2; i += 1) { str a = substr(v, i, i); str b = substr(v, i+1, i+1); str c = substr(v, i+2, i+2); @abc_histo[a][b][c] += 1; } } } # ================================================================ end { map a_cmf = compute_cmf_from_histo(@a_histo); # Define these in this scope else they'll be scoped to the for-loops. map ab_cmf = {}; map abc_cmf = {}; for (a in @ab_histo) { ab_cmf[a] = compute_cmf_from_histo(@ab_histo[a]); } for (a in @abc_histo) { for (b in @abc_histo[a]) { abc_cmf[a][b] = compute_cmf_from_histo(@abc_histo[a][b]); } } for (int oi = 0; oi < @ocount; oi += 1) { str oa = sample_from_cmf(a_cmf); str ob = sample_from_cmf(ab_cmf[oa]); str out = oa . ob; for (int i = 2; i < @olen; i += 1) { str oc = sample_from_cmf(abc_cmf[oa][ob]); if (oc == "") { break; } out .= oc; oa = ob; ob = oc; } print out; } }