%PDF-1.6
%
1 0 obj
<>
endobj
2 0 obj
<>stream
Nicholas T. Franklin, Michael J. Frank
Compositional clustering in task structure learning
www.ploscompbiol.org
www.ploscompbiol.org
endstream
endobj
3 0 obj
<>/XObject<>>>/CropBox[0 0 612 792]/MediaBox[0 0 612 792]/Parent 12 0 R/Annots 13 0 R/Contents 14 0 R/TrimBox[0 0 612 792]>>
endobj
13 0 obj
[15 0 R 16 0 R 17 0 R 18 0 R 19 0 R 20 0 R 21 0 R 22 0 R 23 0 R 24 0 R 25 0 R 26 0 R 27 0 R 28 0 R]
endobj
15 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref001)>>
endobj
16 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref002)>>
endobj
17 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref003)>>
endobj
18 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref003)>>
endobj
19 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref004)>>
endobj
20 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref003)>>
endobj
21 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref005)>>
endobj
22 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref006)>>
endobj
23 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref009)>>
endobj
24 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref010)>>
endobj
25 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref012)>>
endobj
26 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref001)>>
endobj
27 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref013)>>
endobj
28 0 obj
<>/Border[0 0 0]/A 29 0 R>>
endobj
29 0 obj
<>
endobj
14 0 obj
[30 0 R 31 0 R 32 0 R 33 0 R 34 0 R 35 0 R 36 0 R 37 0 R 38 0 R 39 0 R 40 0 R 41 0 R]
endobj
30 0 obj
<>stream
q
0.955 g
0 w
199.9998 713.9999 m
575.9997 713.9999 l
575.9997 559.0003 l
199.9998 559.0003 l
f*
0.83 0.64 0.02 0 k
203.4142 458.9291 m
208.1764 458.9291 l
h
f*
415.1622 432.9071 m
419.9244 432.9071 l
h
f*
424.3465 432.9071 m
429.1087 432.9071 l
h
f*
225.411 328.9323 m
230.1732 328.9323 l
h
f*
234.652 328.9323 m
239.4142 328.9323 l
h
f*
518.4 263.9055 m
523.1622 263.9055 l
h
f*
528.3213 263.9055 m
533.0835 263.9055 l
h
f*
488.863 211.9181 m
493.6252 211.9181 l
h
f*
498.7843 211.9181 m
503.5465 211.9181 l
h
f*
387.9496 159.9307 m
397.474 159.9307 l
h
f*
402.6331 159.9307 m
412.1575 159.9307 l
h
f*
393.1087 81.9213 m
397.8709 81.9213 l
h
f*
402.2929 81.9213 m
411.8173 81.9213 l
h
f*
0 g
1 j
1 J
10 0 0 10 209.9905 696.9826 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(frameworks)Tj
4.9776 0 Td
(of)Tj
1.0148 0 Td
(learning,)Tj
3.7473 0 Td
(forcing)Tj
3.0954 0 Td
(agents)Tj
2.7496 0 Td
(either)Tj
2.5285 0 Td
(to)Tj
1.0262 0 Td
(generalize)Tj
4.2349 0 Td
(entire)Tj
2.5512 0 Td
(learned)Tj
3.1974 0 Td
(policies)Tj
3.2315 0 Td
(or)Tj
1.0998 0 Td
(to)Tj
-33.4542 -1.2982 Td
(learn)Tj
2.245 0 Td
(new)Tj
1.8765 0 Td
(policies)Tj
3.2315 0 Td
(from)Tj
2.2053 0 Td
(scratch.)Tj
3.2882 0 Td
(Here,)Tj
2.4264 0 Td
(we)Tj
1.3323 0 Td
(propose)Tj
3.4242 0 Td
(a)Tj
0.652 0 Td
(solution)Tj
3.4809 0 Td
(to)Tj
1.0262 0 Td
(this)Tj
1.6724 0 Td
(problem)Tj
3.6113 0 Td
(that)Tj
1.7801 0 Td
(allows)Tj
-32.2523 -1.2983 Td
(an)Tj
1.2018 0 Td
(agent)Tj
2.3925 0 Td
(to)Tj
1.0261 0 Td
(generalize)Tj
4.2349 0 Td
(components)Tj
5.1761 0 Td
(of)Tj
1.0148 0 Td
(a)Tj
0.6519 0 Td
(policy)Tj
2.6362 0 Td
(independently)Tj
5.9754 0 Td
(and)Tj
1.7291 0 Td
(compare)Tj
3.7191 0 Td
(it)Tj
0.7823 0 Td
(to)Tj
1.0262 0 Td
(an)Tj
1.2018 0 Td
(agent)Tj
-32.7682 -1.3039 Td
(that)Tj
1.7801 0 Td
(generalizes)Tj
4.5978 0 Td
(components)Tj
5.1703 0 Td
(as)Tj
1.0148 0 Td
(a)Tj
0.6577 0 Td
(whole.)Tj
2.8346 0 Td
(We)Tj
1.6044 0 Td
(show)Tj
2.3017 0 Td
(that)Tj
1.7801 0 Td
(the)Tj
1.4684 0 Td
(degree)Tj
2.8573 0 Td
(to)Tj
1.0205 0 Td
(which)Tj
2.6532 0 Td
(one)Tj
1.7007 0 Td
(form)Tj
2.2054 0 Td
(of)Tj
-33.647 -1.2983 Td
(generalization)Tj
5.8676 0 Td
(is)Tj
0.8504 0 Td
(favored)Tj
3.2258 0 Td
(over)Tj
1.9729 0 Td
(the)Tj
1.474 0 Td
(other)Tj
2.3471 0 Td
(is)Tj
0.8447 0 Td
(dependent)Tj
4.4617 0 Td
(on)Tj
1.2756 0 Td
(the)Tj
1.4683 0 Td
(features)Tj
3.3449 0 Td
(of)Tj
1.0148 0 Td
(task)Tj
1.8142 0 Td
(domain,)Tj
3.5489 0 Td
(with)Tj
-33.5109 -1.2982 Td
(independent)Tj
5.278 0 Td
(generalization)Tj
5.862 0 Td
(of)Tj
1.0148 0 Td
(task)Tj
1.8142 0 Td
(components)Tj
5.1704 0 Td
(favored)Tj
3.2258 0 Td
(in)Tj
1.0374 0 Td
(environments)Tj
5.794 0 Td
(with)Tj
1.9956 0 Td
(weak)Tj
2.2564 0 Td
(rela-)Tj
-33.4486 -1.3039 Td
(tionships)Tj
3.8777 0 Td
(between)Tj
3.5263 0 Td
(components)Tj
5.176 0 Td
(or)Tj
1.0942 0 Td
(high)Tj
2.0126 0 Td
(degrees)Tj
3.2144 0 Td
(of)Tj
1.0148 0 Td
(noise)Tj
2.3244 0 Td
(and)Tj
1.7348 0 Td
(joint)Tj
2.0977 0 Td
(generalization)Tj
5.862 0 Td
(of)Tj
1.0148 0 Td
(task)Tj
-32.9497 -1.2983 Td
(components)Tj
5.176 0 Td
(favored)Tj
3.2258 0 Td
(when)Tj
2.4038 0 Td
(there)Tj
2.262 0 Td
(is)Tj
0.8504 0 Td
(a)Tj
0.6519 0 Td
(clear,)Tj
2.3471 0 Td
(discoverable)Tj
5.1647 0 Td
(relationship)Tj
4.9889 0 Td
(between)Tj
3.5263 0 Td
(task)Tj
1.8142 0 Td
(compo-)Tj
-32.4111 -1.2983 Td
(nents.)Tj
2.6248 0 Td
(Furthermore,)Tj
5.6182 0 Td
(we)Tj
1.3267 0 Td
(show)Tj
2.296 0 Td
(that)Tj
1.7801 0 Td
(the)Tj
1.4684 0 Td
(overall)Tj
2.9026 0 Td
(meta)Tj
2.1997 0 Td
(structure)Tj
3.8211 0 Td
(of)Tj
1.0148 0 Td
(the)Tj
1.4683 0 Td
(environment)Tj
5.4312 0 Td
(can)Tj
1.6271 0 Td
(be)Tj
-33.579 -1.2982 Td
(learned)Tj
3.1974 0 Td
(and)Tj
1.7291 0 Td
(leveraged)Tj
3.9912 0 Td
(by)Tj
1.1792 0 Td
(an)Tj
1.2019 0 Td
(agent)Tj
2.3924 0 Td
(that)Tj
1.7745 0 Td
(dynamically)Tj
5.0796 0 Td
(arbitrates)Tj
3.9855 0 Td
(between)Tj
3.5263 0 Td
(these)Tj
2.2564 0 Td
(forms)Tj
2.5681 0 Td
(of)Tj
-32.8816 -1.304 Td
(structure)Tj
3.821 0 Td
(learning.)Tj
ET
Q
q
1 j
1 J
0 w
11.9999 0 0 11.9999 200.0125 516.0188 cm
BT
/F2 1 Tf
1 TL
-0.0033 Tc
0 0 Td
(Introduction)Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 200.0125 499.011 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(Compared)Tj
4.4843 0 Td
(to)Tj
1.0262 0 Td
(artificial)Tj
3.5149 0 Td
(agents,)Tj
2.9764 0 Td
(humans)Tj
3.4355 0 Td
(exhibit)Tj
2.9764 0 Td
(remarkable)Tj
4.7452 0 Td
(flexibility)Tj
3.9514 0 Td
(in)Tj
1.0375 0 Td
(our)Tj
1.6271 0 Td
(ability)Tj
2.6929 0 Td
(to)Tj
1.0261 0 Td
(rapidly,)Tj
-33.4939 -1.3039 Td
(spontaneously)Tj
5.9527 0 Td
(and)Tj
1.7291 0 Td
(appropriately)Tj
5.5785 0 Td
(learn)Tj
2.2451 0 Td
(to)Tj
1.0261 0 Td
(behave)Tj
2.9934 0 Td
(in)Tj
1.0318 0 Td
(unfamiliar)Tj
4.4277 0 Td
(situations,)Tj
4.3143 0 Td
(by)Tj
1.1792 0 Td
(generalizing)Tj
5.0966 0 Td
(past)Tj
-35.5745 -1.2982 Td
(experience)Tj
4.507 0 Td
(and)Tj
1.7291 0 Td
(performing)Tj
4.7962 0 Td
(symbolic-like)Tj
5.5899 0 Td
(operations)Tj
4.456 0 Td
(on)Tj
1.2756 0 Td
(constituent)Tj
4.7225 0 Td
(components)Tj
5.176 0 Td
(of)Tj
1.0148 0 Td
(knowledge)Tj
-33.2671 -1.2983 Td
([)Tj
0.83 0.64 0.02 0 k
(1)Tj
0 g
(].)Tj
1.5987 0 Td
(Formal)Tj
3.1294 0 Td
(models)Tj
3.1011 0 Td
(of)Tj
1.0148 0 Td
(human)Tj
3.0784 0 Td
(learning)Tj
3.5263 0 Td
(have)Tj
2.0579 0 Td
(cast)Tj
1.7405 0 Td
(generalization)Tj
5.862 0 Td
(as)Tj
1.0148 0 Td
(an)Tj
1.2075 0 Td
(inference)Tj
3.9345 0 Td
(problem)Tj
3.6113 0 Td
(in)Tj
-34.8772 -1.2983 Td
(which)Tj
2.6475 0 Td
(people)Tj
2.8573 0 Td
(learn)Tj
2.245 0 Td
(a)Tj
0.652 0 Td
(shared)Tj
2.863 0 Td
(\(latent\))Tj
3.1521 0 Td
(task)Tj
1.8085 0 Td
(structure)Tj
3.821 0 Td
(across)Tj
2.6816 0 Td
(multiple)Tj
3.566 0 Td
(contexts)Tj
3.5432 0 Td
(and)Tj
1.7292 0 Td
(then)Tj
2.0182 0 Td
(infer)Tj
-33.5846 -1.3039 Td
(which)Tj
2.6475 0 Td
(causal)Tj
2.6475 0 Td
(structure)Tj
3.8211 0 Td
(best)Tj
1.8142 0 Td
(suits)Tj
2.0352 0 Td
(the)Tj
1.4684 0 Td
(current)Tj
3.1804 0 Td
(scenario)Tj
3.5603 0 Td
([)Tj
0.83 0.64 0.02 0 k
(2)Tj
0 g
(,)Tj
0.83 0.64 0.02 0 k
1.2586 0 Td
(3)Tj
0 g
(].)Tj
1.2642 0 Td
(In)Tj
1.1055 0 Td
(these)Tj
2.2564 0 Td
(models,)Tj
3.3279 0 Td
(a)Tj
0.6519 0 Td
(context,)Tj
3.4129 0 Td
(typi-)Tj
-34.452 -1.2982 Td
(cally)Tj
2.0239 0 Td
(an)Tj
1.2019 0 Td
(observable)Tj
4.456 0 Td
(\(or)Tj
1.44 0 Td
(partially)Tj
3.4866 0 Td
(observable\))Tj
4.7962 0 Td
(feature)Tj
2.9877 0 Td
(of)Tj
1.0148 0 Td
(the)Tj
1.4683 0 Td
(environment,)Tj
5.6522 0 Td
(is)Tj
0.8504 0 Td
(linked)Tj
2.7326 0 Td
(to)Tj
1.0205 0 Td
(a)Tj
0.6576 0 Td
(learnable)Tj
-33.7887 -1.2983 Td
(set)Tj
1.3039 0 Td
(of)Tj
1.0148 0 Td
(task)Tj
1.8085 0 Td
(statistics)Tj
3.5886 0 Td
(or)Tj
1.0998 0 Td
(rules.)Tj
2.3755 0 Td
(Based)Tj
2.5455 0 Td
(on)Tj
1.2755 0 Td
(statistics)Tj
3.5887 0 Td
(and)Tj
1.7291 0 Td
(the)Tj
1.4683 0 Td
(opportunity)Tj
5.0343 0 Td
(for)Tj
1.389 0 Td
(generalization,)Tj
6.0945 0 Td
(the)Tj
-34.316 -1.3039 Td
(learner)Tj
3.0387 0 Td
(has)Tj
1.542 0 Td
(to)Tj
1.0261 0 Td
(infer)Tj
2.1147 0 Td
(which)Tj
2.6532 0 Td
(environmental)Tj
6.1114 0 Td
(features)Tj
3.3449 0 Td
(\(stimulus)Tj
3.9685 0 Td
(dimensions,)Tj
5.0796 0 Td
(episodes,)Tj
3.8325 0 Td
(etc.\))Tj
1.9275 0 Td
(should)Tj
-34.6391 -1.2983 Td
(constitute)Tj
4.1725 0 Td
(the)Tj
1.4684 0 Td
(context)Tj
3.1861 0 Td
(that)Tj
1.7801 0 Td
(signals)Tj
2.9027 0 Td
(the)Tj
1.4683 0 Td
(overall)Tj
2.9027 0 Td
(task)Tj
1.8085 0 Td
(structure,)Tj
4.0478 0 Td
(and,)Tj
1.9559 0 Td
(simultaneously,)Tj
6.4686 0 Td
(which)Tj
2.6476 0 Td
(fea-)Tj
-34.8092 -1.2983 Td
(tures)Tj
2.1996 0 Td
(are)Tj
1.4514 0 Td
(indicative)Tj
4.1328 0 Td
(of)Tj
1.0148 0 Td
(the)Tj
1.4684 0 Td
(specific)Tj
3.1918 0 Td
(appropriate)Tj
4.8755 0 Td
(behaviors)Tj
4.0762 0 Td
(for)Tj
1.3833 0 Td
(the)Tj
1.4684 0 Td
(inferred)Tj
3.4412 0 Td
(task)Tj
1.8085 0 Td
(structure.)Tj
4.0535 0 Td
(This)Tj
-34.5654 -1.3039 Td
(learning)Tj
3.5206 0 Td
(strategy)Tj
3.3278 0 Td
(is)Tj
0.8504 0 Td
(well)Tj
1.8198 0 Td
(captured)Tj
3.7417 0 Td
(by)Tj
1.1849 0 Td
(Bayesian)Tj
3.719 0 Td
(nonparametric)Tj
6.1852 0 Td
(models,)Tj
3.3279 0 Td
(and)Tj
1.7347 0 Td
(neural)Tj
2.7723 0 Td
(network)Tj
-32.1843 -1.2982 Td
(approximations)Tj
6.5309 0 Td
(thereof,)Tj
3.2882 0 Td
(that)Tj
1.7745 0 Td
(impose)Tj
3.1181 0 Td
(a)Tj
0.6519 0 Td
(hierarchical)Tj
4.938 0 Td
(clustering)Tj
4.1555 0 Td
(process)Tj
3.1805 0 Td
(onto)Tj
2.0806 0 Td
(learning)Tj
3.5263 0 Td
(task)Tj
1.8085 0 Td
(struc-)Tj
-35.053 -1.2983 Td
(tures)Tj
2.1996 0 Td
([)Tj
0.83 0.64 0.02 0 k
(3)Tj
0 g
(,)Tj
0.83 0.64 0.02 0 k
1.2643 0 Td
(4)Tj
0 g
(].)Tj
1.2585 0 Td
(A)Tj
0.9071 0 Td
(learner)Tj
3.0331 0 Td
(infers)Tj
2.4831 0 Td
(the)Tj
1.4683 0 Td
(probability)Tj
4.5978 0 Td
(that)Tj
1.7802 0 Td
(two)Tj
1.7064 0 Td
(contexts)Tj
3.5433 0 Td
(are)Tj
1.4513 0 Td
(members)Tj
3.9458 0 Td
(of)Tj
1.0148 0 Td
(the)Tj
1.4684 0 Td
(same)Tj
2.262 0 Td
(task)Tj
-34.384 -1.2983 Td
(cluster)Tj
2.8686 0 Td
(via)Tj
1.3776 0 Td
(Bayesian)Tj
3.7247 0 Td
(inference,)Tj
4.1613 0 Td
(and)Tj
1.7291 0 Td
(in)Tj
1.0375 0 Td
(novel)Tj
2.398 0 Td
(situations,)Tj
4.3144 0 Td
(has)Tj
1.542 0 Td
(a)Tj
0.6576 0 Td
(prior)Tj
2.2507 0 Td
(to)Tj
1.0262 0 Td
(reapply)Tj
3.1861 0 Td
(the)Tj
1.4683 0 Td
(task)Tj
1.8085 0 Td
(structures)Tj
-33.5506 -1.3039 Td
(that)Tj
1.7744 0 Td
(have)Tj
2.0636 0 Td
(been)Tj
2.1203 0 Td
(more)Tj
2.3414 0 Td
(popular)Tj
3.3392 0 Td
(across)Tj
2.6816 0 Td
(disparate)Tj
3.8551 0 Td
(contexts,)Tj
3.77 0 Td
(while)Tj
2.3698 0 Td
(also)Tj
1.7631 0 Td
(allowing)Tj
3.6227 0 Td
(for)Tj
1.3833 0 Td
(the)Tj
1.4683 0 Td
(potential)Tj
3.7644 0 Td
(to)Tj
-36.3172 -1.2982 Td
(create)Tj
2.5908 0 Td
(a)Tj
0.6576 0 Td
(new)Tj
1.8766 0 Td
(structure)Tj
3.821 0 Td
(as)Tj
1.0148 0 Td
(needed.)Tj
3.3222 0 Td
(Empirical)Tj
4.1329 0 Td
(studies)Tj
2.9877 0 Td
(have)Tj
2.0579 0 Td
(provided)Tj
3.8154 0 Td
(evidence)Tj
3.7134 0 Td
(that)Tj
1.7802 0 Td
(humans)Tj
3.4355 0 Td
(spon-)Tj
-35.206 -1.2983 Td
(taneously)Tj
4.0195 0 Td
(impute)Tj
3.0727 0 Td
(such)Tj
2.0636 0 Td
(hierarchical)Tj
4.9323 0 Td
(structure,)Tj
4.0478 0 Td
(which)Tj
2.6532 0 Td
(facilitates)Tj
3.9628 0 Td
(future)Tj
2.6532 0 Td
(transfer,)Tj
3.5433 0 Td
(whether)Tj
3.4753 0 Td
(or)Tj
1.0998 0 Td
(not)Tj
-35.5235 -1.3039 Td
(it)Tj
0.7823 0 Td
(is)Tj
0.8504 0 Td
(immediately)Tj
5.1987 0 Td
(beneficialand,)Tj
6.7124 0 Td
(indeed,)Tj
3.1634 0 Td
(even)Tj
2.0693 0 Td
(if)Tj
0.7767 0 Td
(it)Tj
0.7824 0 Td
(is)Tj
0.8504 0 Td
(costlyto)Tj
4.2406 0 Td
(initial)Tj
2.5455 0 Td
(learning)Tj
3.5262 0 Td
([)Tj
0.83 0.64 0.02 0 k
(3)Tj
0 g
()Tj
0.83 0.64 0.02 0 k
(5)Tj
0 g
(].)Tj
-30.3021 -1.2983 Td
(These)Tj
2.5681 0 Td
(clustering)Tj
4.1556 0 Td
(models)Tj
3.1011 0 Td
(can)Tj
1.6271 0 Td
(account)Tj
3.3845 0 Td
(for)Tj
1.3833 0 Td
(aspects)Tj
3.0387 0 Td
(of)Tj
1.0148 0 Td
(human)Tj
3.0784 0 Td
(generalization)Tj
5.8677 0 Td
(that)Tj
1.7802 0 Td
(are)Tj
1.4456 0 Td
(not)Tj
1.5761 0 Td
(well)Tj
-35.2174 -1.2983 Td
(explained)Tj
4.0705 0 Td
(by)Tj
1.1848 0 Td
(standard)Tj
3.7191 0 Td
(models)Tj
3.1067 0 Td
(of)Tj
1.0148 0 Td
(learning.)Tj
3.7474 0 Td
(This)Tj
1.9899 0 Td
(approach)Tj
3.9515 0 Td
(to)Tj
1.0261 0 Td
(generalization,)Tj
6.0945 0 Td
(treating)Tj
3.3222 0 Td
(multiple)Tj
-33.2275 -1.3039 Td
(contexts)Tj
3.5432 0 Td
(as)Tj
1.0148 0 Td
(sharing)Tj
3.1975 0 Td
(a)Tj
0.652 0 Td
(common)Tj
3.8437 0 Td
(task)Tj
1.8142 0 Td
(structure,)Tj
4.0478 0 Td
(is)Tj
0.8447 0 Td
(similar)Tj
2.9877 0 Td
(to)Tj
1.0262 0 Td
(artificial)Tj
3.5149 0 Td
(agents)Tj
2.7496 0 Td
(that)Tj
1.7801 0 Td
(reuse)Tj
2.3244 0 Td
(previously)Tj
-33.3408 -1.2982 Td
(learned)Tj
3.1917 0 Td
(policies)Tj
3.2372 0 Td
(in)Tj
1.0318 0 Td
(novel)Tj
2.4038 0 Td
(tasks)Tj
2.1656 0 Td
(when)Tj
2.4038 0 Td
(the)Tj
1.474 0 Td
(statistics)Tj
3.5886 0 Td
(are)Tj
1.4457 0 Td
(sufficiently)Tj
4.6148 0 Td
(similar)Tj
2.9877 0 Td
([)Tj
0.83 0.64 0.02 0 k
(6)Tj
0 g
()Tj
0.83 0.64 0.02 0 k
(9)Tj
0 g
(].)Tj
2.5965 0 Td
(However,)Tj
4.0762 0 Td
(a)Tj
0.6519 0 Td
(key)Tj
-35.8693 -1.2983 Td
(limitation)Tj
4.1725 0 Td
(to)Tj
1.0262 0 Td
(these)Tj
2.2507 0 Td
(clustering)Tj
4.1555 0 Td
(models)Tj
3.1068 0 Td
(of)Tj
1.0148 0 Td
(generalization)Tj
5.862 0 Td
(is)Tj
0.8504 0 Td
(that)Tj
1.7801 0 Td
(policies)Tj
3.2315 0 Td
(of)Tj
1.0148 0 Td
(the)Tj
1.4683 0 Td
(agent)Tj
2.3924 0 Td
(are)Tj
1.4457 0 Td
(general-)Tj
-33.7717 -1.3039 Td
(ized)Tj
1.8481 0 Td
(as)Tj
1.0148 0 Td
(a)Tj
0.6577 0 Td
(unit.)Tj
2.0862 0 Td
(That)Tj
2.092 0 Td
(is,)Tj
1.0715 0 Td
(in)Tj
1.0375 0 Td
(a)Tj
0.6519 0 Td
(new)Tj
1.8766 0 Td
(context,)Tj
3.4072 0 Td
(a)Tj
0.6576 0 Td
(previously)Tj
4.3483 0 Td
(learned)Tj
3.1975 0 Td
(policy)Tj
2.6362 0 Td
(can)Tj
1.6271 0 Td
(either)Tj
2.5285 0 Td
(be)Tj
1.1508 0 Td
(reused)Tj
2.8573 0 Td
(or)Tj
1.0942 0 Td
(a)Tj
-35.841 -1.2983 Td
(new)Tj
1.8765 0 Td
(policy)Tj
2.6362 0 Td
(must)Tj
2.2223 0 Td
(be)Tj
1.1509 0 Td
(learned)Tj
3.1974 0 Td
(from)Tj
2.2054 0 Td
(scratch.)Tj
3.2825 0 Td
(This)Tj
1.9899 0 Td
(can)Tj
1.6271 0 Td
(be)Tj
1.1508 0 Td
(problematic)Tj
5.0343 0 Td
(as)Tj
1.0148 0 Td
(policies)Tj
3.2315 0 Td
(are)Tj
1.4457 0 Td
(often)Tj
2.2903 0 Td
(not)Tj
-34.3556 -1.2983 Td
(robust)Tj
2.7892 0 Td
(to)Tj
1.0262 0 Td
(untrained)Tj
4.1669 0 Td
(variation)Tj
3.804 0 Td
(in)Tj
1.0318 0 Td
(task)Tj
1.8142 0 Td
(structure)Tj
3.8211 0 Td
([)Tj
0.83 0.64 0.02 0 k
(10)Tj
0 g
()Tj
0.83 0.64 0.02 0 k
(12)Tj
0 g
(].)Tj
3.5433 0 Td
(Thus,)Tj
2.4774 0 Td
(a)Tj
0.652 0 Td
(previously)Tj
4.3483 0 Td
(learned)Tj
3.1975 0 Td
(policy)Tj
2.6362 0 Td
(can)Tj
-35.3081 -1.2982 Td
(lead)Tj
1.8481 0 Td
(to)Tj
1.0262 0 Td
(a)Tj
0.6576 0 Td
(poor)Tj
2.1203 0 Td
(outcome)Tj
3.7247 0 Td
(in)Tj
1.0375 0 Td
(a)Tj
0.6519 0 Td
(new)Tj
1.8766 0 Td
(context)Tj
3.1861 0 Td
(even)Tj
2.0693 0 Td
(if)Tj
0.7766 0 Td
(there)Tj
2.2621 0 Td
(is)Tj
0.8504 0 Td
(a)Tj
0.6519 0 Td
(substantial)Tj
4.5014 0 Td
(degree)Tj
2.8573 0 Td
(of)Tj
1.0148 0 Td
(shared)Tj
-31.1128 -1.3039 Td
(structure.)Tj
1.1962 -1.2983 Td
(Because)Tj
3.3958 0 Td
(task)Tj
1.8085 0 Td
(structures)Tj
4.184 0 Td
(are)Tj
1.4513 0 Td
(either)Tj
2.5285 0 Td
(reused)Tj
2.8573 0 Td
(or)Tj
1.0941 0 Td
(not)Tj
1.5761 0 Td
(as)Tj
1.0148 0 Td
(a)Tj
0.652 0 Td
(whole,)Tj
2.8346 0 Td
(the)Tj
1.474 0 Td
(ability)Tj
2.6929 0 Td
(to)Tj
1.0261 0 Td
(reuse)Tj
2.3244 0 Td
(and)Tj
1.7291 0 Td
(share)Tj
-33.8397 -1.2983 Td
(component)Tj
4.8131 0 Td
(parts)Tj
2.1997 0 Td
(of)Tj
1.0148 0 Td
(knowledge)Tj
4.5411 0 Td
(is)Tj
0.8504 0 Td
(limited;)Tj
3.2938 0 Td
(that)Tj
1.7802 0 Td
(is,)Tj
1.0715 0 Td
(they)Tj
1.9275 0 Td
(are)Tj
1.4457 0 Td
(not)Tj
/F10 1 Tf
1.576 0 Td
[()7()11()15()4()7()10()14()7()4()11()6( )11(\n)]TJ
/F5 1 Tf
(.)Tj
5.879 0 Td
(Compositionality,)Tj
-30.3928 -1.3039 Td
(or)Tj
1.0941 0 Td
(the)Tj
1.474 0 Td
(ability)Tj
2.6929 0 Td
(to)Tj
1.0262 0 Td
(bind)Tj
2.0692 0 Td
(\(compose\))Tj
4.4617 0 Td
(information)Tj
5.074 0 Td
(together)Tj
3.532 0 Td
(in)Tj
1.0374 0 Td
(a)Tj
0.652 0 Td
(rule)Tj
1.7915 0 Td
(governed)Tj
3.9401 0 Td
(way,)Tj
2.0183 0 Td
(has)Tj
1.542 0 Td
(long)Tj
1.9899 0 Td
(been)Tj
-34.3953 -1.2982 Td
(thought)Tj
3.3732 0 Td
(to)Tj
1.0204 0 Td
(be)Tj
1.1509 0 Td
(a)Tj
0.6576 0 Td
(core)Tj
1.9446 0 Td
(aspect)Tj
2.6759 0 Td
(of)Tj
1.0148 0 Td
(human)Tj
3.0784 0 Td
(cognition)Tj
4.0535 0 Td
([)Tj
0.83 0.64 0.02 0 k
(1)Tj
0 g
(,)Tj
0.83 0.64 0.02 0 k
1.2586 0 Td
(13)Tj
0 g
(].)Tj
1.7404 0 Td
(Importantly,)Tj
5.2781 0 Td
(ecological)Tj
4.1612 0 Td
(contexts)Tj
3.549 0 Td
(often)Tj
ET
Q
q
1 j
1 J
0 w
576 737.1 m
36 737.1 l
36 737.6 l
576 737.6 l
f*
36 741.2598 169.285 23.6976 re
W* n
q
169.2283 0 0 23.6409 36 741.3165 cm
q
/I0 Do
Q
Q
Q
q
0 0 612 792 re
W* n
1 j
1 J
0 w
7.9999 0 0 7.9999 404.844 745.7952 cm
BT
/F0 1 Tf
1 TL
-0.005 Tc
0 0 Td
(Composit)Tj
4.1527 0 Td
(ional)Tj
2.289 0 Td
(clustering)Tj
4.415 0 Td
(in)Tj
0.978 0 Td
(task)Tj
2.0268 0 Td
(structure)Tj
4.0465 0 Td
(learning)Tj
ET
Q
q
1 j
1 J
0 w
36 48.0002 m
576 48.0002 l
576 47.5002 l
36 47.5002 l
f*
0.83 0.64 0.02 0 k
142.5827 34.9228 m
295.8236 34.9228 l
h
f*
0 g
7.9999 0 0 7.9999 36 36 cm
BT
/F0 1 Tf
1 TL
-0.005 Tc
0 0 Td
(PLOS)Tj
2.8559 0 Td
(Computationa)Tj
6.1229 0 Td
(l)Tj
0.4322 0 Td
(Biology)Tj
3.4371 0 Td
(|)Tj
0.83 0.64 0.02 0 k
0.4748 0 Td
(https:/)Tj
2.6788 0 Td
(/doi.org/10.13)Tj
6.0094 0 Td
(71/journal.p)Tj
5.1166 0 Td
(cbi.1006116)Tj
0 g
6.3497 0 Td
(April)Tj
2.1756 0 Td
(19,)Tj
1.5874 0 Td
(2018)Tj
27.9002 0 Td
(2)Tj
0.7654 0 Td
(/)Tj
0.496 0 Td
(25)Tj
/F7 1 Tf
-0.025 Tc
-66.402 84.0904 Td
(Competing)Tj
4.3795 0 Td
(interests)Tj
3.3307 0 Td
(:)Tj
/F8 1 Tf
0.4819 0 Td
(The)Tj
1.5875 0 Td
(authors)Tj
3.0401 0 Td
(have)Tj
1.963 0 Td
(declared)Tj
-14.7827 -1.3748 Td
(that)Tj
1.6228 0 Td
(no)Tj
1.1693 0 Td
(competing)Tj
4.1599 0 Td
(interests)Tj
ET
endstream
endobj
31 0 obj
<>stream
endstream
endobj
32 0 obj
<>stream
endstream
endobj
33 0 obj
<>stream
endstream
endobj
34 0 obj
<>stream
endstream
endobj
35 0 obj
<>stream
endstream
endobj
36 0 obj
<>stream
endstream
endobj
37 0 obj
<>stream
endstream
endobj
38 0 obj
<>stream
endstream
endobj
39 0 obj
<>stream
endstream
endobj
40 0 obj
<>stream
endstream
endobj
41 0 obj
<>stream
BT
10.3394 82.7156 Td
(exist.)Tj
ET
Q
endstream
endobj
42 0 obj
<>/XObject<>>>/CropBox[0 0 612 792]/MediaBox[0 0 612 792]/Parent 12 0 R/Annots 43 0 R/Contents 44 0 R/TrimBox[0 0 612 792]>>
endobj
43 0 obj
[45 0 R 46 0 R 47 0 R]
endobj
45 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref003)>>
endobj
46 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref005)>>
endobj
47 0 obj
<>/Border[0 0 0]/A 48 0 R>>
endobj
48 0 obj
<>
endobj
44 0 obj
[49 0 R 50 0 R 51 0 R 52 0 R]
endobj
49 0 obj
<>stream
q
0.83 0.64 0.02 0 k
438.1795 316.3465 m
442.9417 316.3465 l
h
f*
448.1008 316.3465 m
452.863 316.3465 l
h
f*
0 g
1 j
1 J
0 w
10 0 0 10 200.0125 707.4141 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(share)Tj
2.3357 0 Td
(a)Tj
0.6519 0 Td
(partial)Tj
2.7893 0 Td
(structure,)Tj
4.0479 0 Td
(limiting)Tj
3.4015 0 Td
(the)Tj
1.4684 0 Td
(applicability)Tj
5.1023 0 Td
(of)Tj
1.0148 0 Td
(previously)Tj
4.3483 0 Td
(learned)Tj
3.1975 0 Td
(policies)Tj
3.2314 0 Td
(but)Tj
1.5534 0 Td
(nonethe-)Tj
-33.1424 -1.3039 Td
(less)Tj
1.61 0 Td
(providing)Tj
4.1442 0 Td
(a)Tj
0.6577 0 Td
(generalization)Tj
5.8677 0 Td
(advantage)Tj
4.2406 0 Td
(to)Tj
1.0204 0 Td
(a)Tj
0.6577 0 Td
(compositional)Tj
5.9243 0 Td
(agent.)Tj
-22.9264 -1.2982 Td
(To)Tj
1.3379 0 Td
(provide)Tj
3.2938 0 Td
(a)Tj
0.652 0 Td
(naturalistic)Tj
4.6942 0 Td
(example,)Tj
3.7757 0 Td
(an)Tj
1.2019 0 Td
(adept)Tj
2.4207 0 Td
(musician)Tj
3.8721 0 Td
(can)Tj
1.6271 0 Td
(transfer)Tj
3.3109 0 Td
(a)Tj
0.6576 0 Td
(learned)Tj
3.1918 0 Td
(song)Tj
2.1033 0 Td
(between)Tj
3.5263 0 Td
(a)Tj
-36.8615 -1.2983 Td
(piano)Tj
2.4944 0 Td
(and)Tj
1.7291 0 Td
(a)Tj
0.652 0 Td
(guitar,)Tj
2.812 0 Td
(even)Tj
2.0692 0 Td
(as)Tj
1.0148 0 Td
(the)Tj
1.4684 0 Td
(two)Tj
1.7121 0 Td
(instruments)Tj
5.0456 0 Td
(require)Tj
3.1068 0 Td
(completely)Tj
4.5807 0 Td
(different)Tj
3.6567 0 Td
(physical)Tj
3.4526 0 Td
(move-)Tj
-33.7944 -1.2983 Td
(ments,)Tj
2.8969 0 Td
(implying)Tj
3.8041 0 Td
(that)Tj
1.7802 0 Td
(goals)Tj
2.2336 0 Td
(can)Tj
1.6215 0 Td
(be)Tj
1.1508 0 Td
(generalized)Tj
4.7679 0 Td
(and)Tj
1.7291 0 Td
(reused)Tj
2.8516 0 Td
(independently)Tj
5.9754 0 Td
(of)Tj
1.0148 0 Td
(the)Tj
1.474 0 Td
(actions)Tj
3.0557 0 Td
(needed)Tj
-34.3556 -1.3039 Td
(to)Tj
1.0261 0 Td
(achieve)Tj
3.1691 0 Td
(them.)Tj
2.5171 0 Td
(A)Tj
0.9071 0 Td
(clustering)Tj
4.1499 0 Td
(model)Tj
2.7439 0 Td
(that)Tj
1.7802 0 Td
(generalizes)Tj
4.5978 0 Td
(entire)Tj
2.5511 0 Td
(task)Tj
1.8085 0 Td
(structures)Tj
4.1839 0 Td
(cannot)Tj
2.9821 0 Td
(account)Tj
3.3788 0 Td
(for)Tj
-35.7956 -1.2982 Td
(this)Tj
1.6724 0 Td
(behavior,)Tj
3.9401 0 Td
(and)Tj
1.7291 0 Td
(would)Tj
2.7099 0 Td
(require)Tj
3.1125 0 Td
(instead)Tj
3.0784 0 Td
(that)Tj
1.7801 0 Td
(an)Tj
1.2019 0 Td
(agent)Tj
2.3924 0 Td
(would)Tj
2.7099 0 Td
(need)Tj
2.143 0 Td
(to)Tj
1.0261 0 Td
(relearn)Tj
3.0388 0 Td
(a)Tj
0.6519 0 Td
(song)Tj
2.1033 0 Td
(from)Tj
-33.2898 -1.2983 Td
(scratch)Tj
3.05 0 Td
(to)Tj
1.0148 0 Td
(play)Tj
1.8652 0 Td
(it)Tj
0.7767 0 Td
(on)Tj
1.2642 0 Td
(a)Tj
0.6463 0 Td
(new)Tj
1.8652 0 Td
(instrument.)Tj
4.9039 0 Td
(Worse,)Tj
3.0614 0 Td
(this)Tj
1.6668 0 Td
(clustering)Tj
4.1442 0 Td
(scheme)Tj
3.1861 0 Td
(would)Tj
2.7043 0 Td
(predict)Tj
3.0387 0 Td
(an)Tj
1.1962 0 Td
(unlikely)Tj
-34.384 -1.3039 Td
(interference)Tj
5.0286 0 Td
(effect)Tj
2.3641 0 Td
(where)Tj
2.6532 0 Td
(the)Tj
1.4683 0 Td
(similar)Tj
2.9877 0 Td
(outcome)Tj
3.7247 0 Td
(of)Tj
1.0148 0 Td
(playing)Tj
3.1521 0 Td
(the)Tj
1.4683 0 Td
(same)Tj
2.2621 0 Td
(song)Tj
2.0976 0 Td
(on)Tj
1.2756 0 Td
(two)Tj
1.7121 0 Td
(instruments)Tj
-31.2092 -1.2983 Td
(results)Tj
2.8062 0 Td
(in)Tj
1.0375 0 Td
(the)Tj
1.4683 0 Td
(model)Tj
2.744 0 Td
(incorrectly)Tj
4.558 0 Td
(pooling)Tj
3.2769 0 Td
(motor)Tj
2.7212 0 Td
(policies)Tj
3.2315 0 Td
(across)Tj
2.6815 0 Td
(instruments.)Tj
-23.3289 -1.2983 Td
(Here,)Tj
2.4321 0 Td
(we)Tj
1.3266 0 Td
(propose)Tj
3.4242 0 Td
(a)Tj
0.6576 0 Td
(framework)Tj
4.6148 0 Td
(to)Tj
1.0262 0 Td
(address)Tj
3.2258 0 Td
(one)Tj
1.6951 0 Td
(aspect)Tj
2.6815 0 Td
(of)Tj
1.0148 0 Td
(compositionality)Tj
6.9449 0 Td
(by)Tj
1.1792 0 Td
(decomposing)Tj
-31.419 -1.3039 Td
(task)Tj
1.8084 0 Td
(structuresand)Tj
6.6161 0 Td
(their)Tj
2.1089 0 Td
(separable)Tj
3.9402 0 Td
(potential)Tj
3.7587 0 Td
(for)Tj
1.3889 0 Td
(clusteringinto)Tj
6.6954 0 Td
(reward)Tj
3.0331 0 Td
(functions)Tj
3.9855 0 Td
(and)Tj
1.7348 0 Td
(tran-)Tj
-35.07 -1.2982 Td
(sition)Tj
2.4661 0 Td
(functions.)Tj
4.2179 0 Td
(These)Tj
2.5682 0 Td
(two)Tj
1.7064 0 Td
(independent)Tj
5.2724 0 Td
(functions)Tj
3.9912 0 Td
(of)Tj
1.0148 0 Td
(a)Tj
0.6576 0 Td
(Markov)Tj
3.3732 0 Td
(decision)Tj
3.5433 0 Td
(process)Tj
3.1861 0 Td
(are)Tj
1.4514 0 Td
(suitable)Tj
-33.4486 -1.2983 Td
(units)Tj
2.2223 0 Td
(of)Tj
1.0148 0 Td
(generalization:)Tj
6.0944 0 Td
(if)Tj
0.7711 0 Td
(we)Tj
1.3266 0 Td
(assume)Tj
3.1464 0 Td
(that)Tj
1.7802 0 Td
(an)Tj
1.2018 0 Td
(agent)Tj
2.3925 0 Td
(has)Tj
1.542 0 Td
(knowledge)Tj
4.5411 0 Td
(of)Tj
1.0148 0 Td
(a)Tj
0.6519 0 Td
(state-space)Tj
4.5468 0 Td
(and)Tj
1.7291 0 Td
(the)Tj
1.474 0 Td
(set)Tj
1.2983 0 Td
(of)Tj
-36.7481 -1.3039 Td
(available)Tj
3.668 0 Td
(actions,)Tj
3.2825 0 Td
(then)Tj
2.0182 0 Td
(the)Tj
1.4683 0 Td
(reward)Tj
3.0331 0 Td
(and)Tj
1.7291 0 Td
(transition)Tj
4.1216 0 Td
(functions)Tj
3.9911 0 Td
(are)Tj
1.4457 0 Td
(sufficient)Tj
3.9174 0 Td
(to)Tj
1.0205 0 Td
(determine)Tj
4.3257 0 Td
(the)Tj
1.4683 0 Td
(opti-)Tj
-35.4895 -1.2983 Td
(mal)Tj
1.7177 0 Td
(policy.)Tj
2.863 0 Td
(In)Tj
1.1055 0 Td
(real-world)Tj
4.3823 0 Td
(scenarios,)Tj
4.1443 0 Td
(a)Tj
0.6519 0 Td
(reward)Tj
3.0331 0 Td
(function)Tj
3.6283 0 Td
(may)Tj
1.9276 0 Td
(correspond)Tj
4.7791 0 Td
(to)Tj
1.0262 0 Td
(the)Tj
1.4683 0 Td
(objective)Tj
3.7814 0 Td
(of)Tj
1.0148 0 Td
(an)Tj
-35.5235 -1.2982 Td
(agent)Tj
2.3867 0 Td
(\(what)Tj
2.5058 0 Td
(it)Tj
0.788 0 Td
(would)Tj
2.7099 0 Td
(like)Tj
1.6555 0 Td
(to)Tj
1.0261 0 Td
(achieve)Tj
3.1691 0 Td
(and)Tj
1.7348 0 Td
(the)Tj
1.4683 0 Td
(environmental)Tj
6.1115 0 Td
(states)Tj
2.3924 0 Td
(that)Tj
1.7802 0 Td
(produce)Tj
3.5206 0 Td
(these)Tj
2.2507 0 Td
(goals\).)Tj
2.8006 0 Td
(A)Tj
-36.3002 -1.2983 Td
(transition)Tj
4.1215 0 Td
(function)Tj
3.6283 0 Td
(determines)Tj
4.6828 0 Td
(how)Tj
1.9389 0 Td
(the)Tj
1.4684 0 Td
(agent's)Tj
2.965 0 Td
(actions)Tj
3.0614 0 Td
(affect)Tj
2.3754 0 Td
(its)Tj
1.1452 0 Td
(environment)Tj
5.4311 0 Td
(\(i.e.,)Tj
1.9276 0 Td
(the)Tj
1.4683 0 Td
(subse-)Tj
-34.2139 -1.3039 Td
(quent)Tj
2.5228 0 Td
(states\).)Tj
2.965 0 Td
(For)Tj
1.6214 0 Td
(example,)Tj
3.7757 0 Td
(when)Tj
2.4038 0 Td
(playing)Tj
3.1521 0 Td
(music)Tj
2.6192 0 Td
(a)Tj
0.6576 0 Td
(reward)Tj
3.0331 0 Td
(function)Tj
3.6283 0 Td
(might)Tj
2.5965 0 Td
(correspond)Tj
4.7792 0 Td
(to)Tj
1.0261 0 Td
(the)Tj
-34.7808 -1.2983 Td
(desired)Tj
3.118 0 Td
(sequence)Tj
3.8608 0 Td
(of)Tj
1.0148 0 Td
(notes)Tj
2.3584 0 Td
(\(a)Tj
0.9921 0 Td
(scale,)Tj
2.3358 0 Td
(or)Tj
1.0998 0 Td
(a)Tj
0.652 0 Td
(song\))Tj
2.4434 0 Td
(while)Tj
2.3641 0 Td
(the)Tj
1.474 0 Td
(transition)Tj
4.1215 0 Td
(function)Tj
3.6284 0 Td
(might)Tj
2.5965 0 Td
(correspond)Tj
-32.0596 -1.2983 Td
(to)Tj
1.0261 0 Td
(the)Tj
1.4683 0 Td
(actions)Tj
3.0558 0 Td
(needed)Tj
3.0954 0 Td
(to)Tj
1.0261 0 Td
(produce)Tj
3.5206 0 Td
(notes)Tj
2.3584 0 Td
(on)Tj
1.2756 0 Td
(an)Tj
1.2019 0 Td
(instrument.)Tj
4.9096 0 Td
(When)Tj
2.6872 0 Td
(picking)Tj
3.2031 0 Td
(up)Tj
1.2643 0 Td
(a)Tj
0.6519 0 Td
(new)Tj
1.8765 0 Td
(form)Tj
2.2054 0 Td
(of)Tj
1.0148 0 Td
(gui-)Tj
-35.841 -1.3039 Td
(tar,)Tj
1.5477 0 Td
(it)Tj
0.788 0 Td
(may)Tj
1.9275 0 Td
(be)Tj
1.1509 0 Td
(sufficient)Tj
3.9118 0 Td
(for)Tj
1.3833 0 Td
(a)Tj
0.6576 0 Td
(musician)Tj
3.8664 0 Td
(to)Tj
1.0262 0 Td
(play)Tj
1.8708 0 Td
(one)Tj
1.7008 0 Td
(or)Tj
1.0998 0 Td
(two)Tj
1.7065 0 Td
(strings)Tj
2.8913 0 Td
(which)Tj
2.6532 0 Td
(may)Tj
1.9276 0 Td
(then)Tj
2.0182 0 Td
(afford)Tj
2.6362 0 Td
(infer-)Tj
-34.7638 -1.2982 Td
(ence)Tj
2.0352 0 Td
(of)Tj
1.0148 0 Td
(the)Tj
1.474 0 Td
(entire)Tj
2.5512 0 Td
(transition)Tj
4.1215 0 Td
(functions)Tj
3.9912 0 Td
(\(the)Tj
1.8085 0 Td
(tuning:)Tj
3.1011 0 Td
(strings)Tj
2.8913 0 Td
(and)Tj
1.7291 0 Td
(frets)Tj
1.9616 0 Td
(needed)Tj
3.0954 0 Td
(to)Tj
1.0261 0 Td
(obtain)Tj
2.7836 0 Td
(each)Tj
-33.5846 -1.2983 Td
(note\).)Tj
2.5625 0 Td
(Here,)Tj
2.4321 0 Td
(we)Tj
1.3266 0 Td
(are)Tj
1.4456 0 Td
(concerned)Tj
4.422 0 Td
(with)Tj
1.9956 0 Td
(how)Tj
1.9389 0 Td
(the)Tj
1.4684 0 Td
(inference)Tj
3.9401 0 Td
(of)Tj
1.0148 0 Td
(one)Tj
1.6951 0 Td
(\(reward)Tj
3.3732 0 Td
(or)Tj
1.0998 0 Td
(transition\))Tj
4.4617 0 Td
(function)Tj
-33.1764 -1.3039 Td
(affects)Tj
2.7325 0 Td
(generalization)Tj
5.8677 0 Td
(of)Tj
1.0148 0 Td
(the)Tj
1.474 0 Td
(other.)Tj
-9.8928 -1.2983 Td
(We)Tj
1.61 0 Td
(consider)Tj
3.651 0 Td
(two)Tj
1.7121 0 Td
(approaches)Tj
4.7339 0 Td
(to)Tj
1.0261 0 Td
(clustering)Tj
4.1499 0 Td
(and)Tj
1.7348 0 Td
(compare)Tj
3.7134 0 Td
(their)Tj
2.1089 0 Td
(relative)Tj
3.1408 0 Td
(generalization)Tj
5.862 0 Td
(advan-)Tj
-34.6391 -1.2983 Td
(tages)Tj
2.1996 0 Td
(as)Tj
1.0148 0 Td
(a)Tj
0.6577 0 Td
(function)Tj
3.6283 0 Td
(of)Tj
1.0148 0 Td
(environmental)Tj
6.1114 0 Td
(statistics.)Tj
3.8098 0 Td
(The)Tj
/F10 1 Tf
1.7858 0 Td
[()12()6()4()2()4()2()6()4()2()22()]TJ
5.0116 0 Td
[()13(\n)12(\r)-4()9()11()2()-9()12()13()]TJ
/F5 1 Tf
3.9458 0 Td
(agent)Tj
2.3868 0 Td
(supports)Tj
3.685 0 Td
(gen-)Tj
-35.2514 -1.2982 Td
(eralization)Tj
4.4276 0 Td
(by)Tj
1.1849 0 Td
(clustering)Tj
4.1499 0 Td
(contexts)Tj
3.5433 0 Td
(into)Tj
1.8425 0 Td
(independent)Tj
5.2781 0 Td
(sets)Tj
1.6611 0 Td
(defined)Tj
3.2258 0 Td
(by)Tj
1.1849 0 Td
(the)Tj
1.4683 0 Td
(reward)Tj
3.033 0 Td
(and)Tj
1.7292 0 Td
(transition)Tj
-32.7286 -1.3039 Td
(statistics,)Tj
3.8154 0 Td
(respectively.)Tj
5.108 0 Td
(In)Tj
1.1111 0 Td
(contrast,)Tj
3.685 0 Td
(the)Tj
/F10 1 Tf
1.4684 0 Td
[()3()11()12()22()]TJ
2.0352 0 Td
[()13(\n)12(\r)-4()9()11()2()-9()12()13()]TJ
/F5 1 Tf
3.9459 0 Td
(agent)Tj
2.3867 0 Td
(clusters)Tj
3.2372 0 Td
(contexts)Tj
3.5432 0 Td
(into)Tj
1.8425 0 Td
(a)Tj
0.652 0 Td
(single)Tj
2.5342 0 Td
(set)Tj
1.2982 0 Td
(of)Tj
-36.663 -1.2983 Td
(clusters)Tj
3.2314 0 Td
(that)Tj
1.7802 0 Td
(binds)Tj
2.4321 0 Td
(together)Tj
3.5319 0 Td
(the)Tj
1.4684 0 Td
(transition)Tj
4.1215 0 Td
(and)Tj
1.7291 0 Td
(reward)Tj
3.0331 0 Td
(functions)Tj
3.9911 0 Td
(\(hence)Tj
2.9084 0 Td
(amounting)Tj
4.6318 0 Td
(to)Tj
1.0261 0 Td
(previous)Tj
-33.8851 -1.2983 Td
(models)Tj
3.101 0 Td
(of)Tj
1.0148 0 Td
(task-set)Tj
3.2485 0 Td
(structure)Tj
3.8211 0 Td
(that)Tj
1.7801 0 Td
(cluster)Tj
2.8687 0 Td
(and)Tj
1.7291 0 Td
(re-use)Tj
2.6816 0 Td
(policies)Tj
3.2314 0 Td
([)Tj
0.83 0.64 0.02 0 k
(3)Tj
0 g
()Tj
0.83 0.64 0.02 0 k
(5)Tj
0 g
(]\).)Tj
2.931 0 Td
(Necessarily,)Tj
4.9493 0 Td
(independent)Tj
-31.3566 -1.3039 Td
(clustering)Tj
4.1498 0 Td
(is)Tj
0.8504 0 Td
(compositional)Tj
5.9244 0 Td
(and)Tj
1.7291 0 Td
(requires)Tj
3.4696 0 Td
(the)Tj
1.474 0 Td
(binding)Tj
3.3505 0 Td
(of)Tj
1.0148 0 Td
(two)Tj
1.7065 0 Td
(independent)Tj
5.2781 0 Td
(functions.)Tj
-27.751 -1.2982 Td
(We)Tj
1.6044 0 Td
(show)Tj
2.2903 0 Td
(that)Tj
1.7688 0 Td
(these)Tj
2.2451 0 Td
(two)Tj
1.7008 0 Td
(models)Tj
3.0954 0 Td
(lead)Tj
1.8425 0 Td
(to)Tj
1.0204 0 Td
(different)Tj
3.6454 0 Td
(predictions)Tj
4.7225 0 Td
(depending)Tj
4.4617 0 Td
(on)Tj
1.2699 0 Td
(the)Tj
1.457 0 Td
(task)Tj
1.8028 0 Td
(environ-)Tj
-34.1232 -1.2983 Td
(ment,)Tj
2.5341 0 Td
(and)Tj
1.7291 0 Td
(we)Tj
1.3266 0 Td
(provide)Tj
3.2882 0 Td
(an)Tj
1.2076 0 Td
(information)Tj
5.0739 0 Td
(theoretic)Tj
3.7588 0 Td
(analysis)Tj
3.3278 0 Td
(to)Tj
1.0261 0 Td
(formalize)Tj
3.9912 0 Td
(and)Tj
1.7291 0 Td
(quantify)Tj
3.5433 0 Td
(the)Tj
1.4683 0 Td
(bounds)Tj
-34.0041 -1.3039 Td
(of)Tj
1.0147 0 Td
(these)Tj
2.2507 0 Td
(advantages/disadva)Tj
7.7216 0 Td
(ntages.)Tj
2.9707 0 Td
(In)Tj
1.1111 0 Td
(environments)Tj
5.794 0 Td
(where)Tj
2.6476 0 Td
(there)Tj
2.2677 0 Td
(is)Tj
0.8447 0 Td
(a)Tj
0.6519 0 Td
(clear,)Tj
2.3471 0 Td
(discoverable)Tj
5.1647 0 Td
(rela-)Tj
-34.7865 -1.2983 Td
(tionship)Tj
3.5149 0 Td
(between)Tj
3.5263 0 Td
(transitions)Tj
4.4843 0 Td
(and)Tj
1.7292 0 Td
(rewards,)Tj
3.617 0 Td
(joint)Tj
2.0976 0 Td
(clustering)Tj
4.1555 0 Td
(facilitates)Tj
3.9572 0 Td
(generalization)Tj
5.8677 0 Td
(by)Tj
1.1848 0 Td
(allowing)Tj
-34.1345 -1.2983 Td
(an)Tj
1.2018 0 Td
(agent)Tj
2.3868 0 Td
(to)Tj
1.0261 0 Td
(infer)Tj
2.1203 0 Td
(one)Tj
1.7008 0 Td
(function)Tj
3.6283 0 Td
(based)Tj
2.4718 0 Td
(on)Tj
1.2756 0 Td
(observations)Tj
5.2611 0 Td
(that)Tj
1.7745 0 Td
(are)Tj
1.4513 0 Td
(informative)Tj
4.8982 0 Td
(about)Tj
2.4945 0 Td
(the)Tj
1.4683 0 Td
(other.)Tj
-33.1594 -1.3039 Td
(Nonetheless,)Tj
5.3007 0 Td
(we)Tj
1.3266 0 Td
(show)Tj
2.3017 0 Td
(that)Tj
1.7745 0 Td
(independent)Tj
5.2781 0 Td
(clustering)Tj
4.1499 0 Td
(can)Tj
1.6271 0 Td
(lead)Tj
1.8538 0 Td
(to)Tj
1.0261 0 Td
(superior)Tj
3.566 0 Td
(generalization)Tj
5.8677 0 Td
(even)Tj
2.0693 0 Td
(in)Tj
-36.1415 -1.2982 Td
(such)Tj
2.0579 0 Td
(cases)Tj
2.2223 0 Td
(when)Tj
2.4038 0 Td
(the)Tj
1.4683 0 Td
(transition-reward)Tj
7.285 0 Td
(relationship)Tj
4.989 0 Td
(is)Tj
0.8504 0 Td
(weak,)Tj
2.4831 0 Td
(difficult)Tj
3.3505 0 Td
(to)Tj
1.0262 0 Td
(discover,)Tj
3.7814 0 Td
(or)Tj
1.0998 0 Td
(costly)Tj
2.5115 0 Td
(to)Tj
1.0261 0 Td
(do)Tj
-36.5553 -1.2983 Td
(so.)Tj
1.3095 0 Td
(Finally,)Tj
3.1748 0 Td
(we)Tj
1.3266 0 Td
(develop)Tj
3.3166 0 Td
(a)Tj
0.6576 0 Td
(meta-structure)Tj
6.1455 0 Td
(learning)Tj
3.5262 0 Td
(agent)Tj
2.3868 0 Td
(that)Tj
1.7801 0 Td
(can)Tj
1.6271 0 Td
(infer)Tj
2.1203 0 Td
(whether)Tj
3.4753 0 Td
(the)Tj
1.4683 0 Td
(overall)Tj
2.9027 0 Td
(envi-)Tj
-35.2174 -1.2983 Td
(ronment)Tj
3.736 0 Td
(is)Tj
0.8504 0 Td
(better)Tj
2.5398 0 Td
(described)Tj
4.0535 0 Td
(by)Tj
1.1792 0 Td
(independent)Tj
5.2781 0 Td
(or)Tj
1.0942 0 Td
(joint)Tj
2.0976 0 Td
(statistics.)Tj
ET
Q
q
1 j
1 J
0 w
11.9999 0 0 11.9999 200.0125 151.9937 cm
BT
/F2 1 Tf
1 TL
-0.0033 Tc
0 0 Td
(Models)Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 200.0125 134.9858 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(To)Tj
1.3379 0 Td
(provide)Tj
3.2882 0 Td
(a)Tj
0.6519 0 Td
(test-bed)Tj
3.4129 0 Td
(for)Tj
1.3833 0 Td
(characterizing)Tj
5.8904 0 Td
(the)Tj
1.4683 0 Td
(effects)Tj
2.7269 0 Td
(compositional)Tj
5.9244 0 Td
(structure,)Tj
4.0478 0 Td
(we)Tj
1.3266 0 Td
(consider)Tj
3.6511 0 Td
(a)Tj
-35.1097 -1.2982 Td
(series)Tj
2.4264 0 Td
(of)Tj
1.0148 0 Td
(navigation)Tj
4.4447 0 Td
(tasks)Tj
2.1713 0 Td
(by)Tj
1.1792 0 Td
(utilizing)Tj
3.5206 0 Td
(grid)Tj
1.8539 0 Td
(worlds)Tj
2.914 0 Td
(as)Tj
1.0148 0 Td
(a)Tj
0.6576 0 Td
(simplification)Tj
5.7316 0 Td
(of)Tj
1.0148 0 Td
(real-world)Tj
4.3823 0 Td
(environ-)Tj
-32.326 -1.2983 Td
(ments.)Tj
2.8969 0 Td
(In)Tj
1.1055 0 Td
(these)Tj
2.2564 0 Td
(grid)Tj
1.8482 0 Td
(worlds,)Tj
3.1464 0 Td
(an)Tj
1.2019 0 Td
(agent)Tj
2.3868 0 Td
(learns)Tj
2.6078 0 Td
(to)Tj
1.0262 0 Td
(navigate)Tj
3.5432 0 Td
(by)Tj
1.1792 0 Td
(learning)Tj
3.5263 0 Td
(transition)Tj
4.1216 0 Td
(functions)Tj
3.9911 0 Td
(\(the)Tj
-34.8375 -1.3039 Td
(consequences)Tj
5.6976 0 Td
(of)Tj
1.0147 0 Td
(its)Tj
1.1452 0 Td
(actions)Tj
3.0614 0 Td
(in)Tj
1.0318 0 Td
(terms)Tj
2.4945 0 Td
(of)Tj
1.0148 0 Td
(subsequent)Tj
4.7055 0 Td
(states\))Tj
2.7382 0 Td
(and)Tj
1.7292 0 Td
(separately)Tj
4.1839 0 Td
(learns)Tj
2.6022 0 Td
(a)Tj
0.6576 0 Td
(reward)Tj
3.0331 0 Td
(func-)Tj
-35.1097 -1.2983 Td
(tion)Tj
1.8425 0 Td
(\(the)Tj
1.8085 0 Td
(reward)Tj
3.033 0 Td
(values)Tj
2.6646 0 Td
(of)Tj
1.0147 0 Td
(locations,)Tj
4.0366 0 Td
(or)Tj
1.0998 0 Td
(goals\))Tj
2.5738 0 Td
(as)Tj
1.0148 0 Td
(it)Tj
0.7824 0 Td
(navigates.)Tj
4.1329 0 Td
(At)Tj
1.2019 0 Td
(each)Tj
2.0296 0 Td
(point)Tj
2.3584 0 Td
(in)Tj
1.0374 0 Td
(time,)Tj
2.2507 0 Td
(the)Tj
1.474 0 Td
(agent)Tj
2.3868 0 Td
(is)Tj
ET
Q
q
1 j
1 J
0 w
576 737.1 m
36 737.1 l
36 737.6 l
576 737.6 l
f*
36 741.2598 169.285 23.6976 re
W* n
q
169.2283 0 0 23.6409 36 741.3165 cm
q
/I0 Do
Q
Q
Q
q
0 0 612 792 re
W* n
1 j
1 J
0 w
7.9999 0 0 7.9999 404.844 745.7952 cm
BT
/F0 1 Tf
1 TL
-0.005 Tc
0 0 Td
(Composit)Tj
4.1527 0 Td
(ional)Tj
2.289 0 Td
(clustering)Tj
4.415 0 Td
(in)Tj
0.978 0 Td
(task)Tj
2.0268 0 Td
(structure)Tj
4.0465 0 Td
(learning)Tj
ET
Q
q
1 j
1 J
0 w
36 48.0002 m
576 48.0002 l
576 47.5002 l
36 47.5002 l
f*
0.83 0.64 0.02 0 k
142.5827 34.9228 m
295.8236 34.9228 l
h
f*
0 g
7.9999 0 0 7.9999 36 36 cm
BT
/F0 1 Tf
1 TL
-0.005 Tc
0 0 Td
(PLOS)Tj
2.8559 0 Td
(Computationa)Tj
6.1229 0 Td
(l)Tj
0.4322 0 Td
(Biology)Tj
3.4371 0 Td
(|)Tj
0.83 0.64 0.02 0 k
0.4748 0 Td
(https:/)Tj
2.6788 0 Td
(/doi.org/10.13)Tj
6.0094 0 Td
(71/journal.p)Tj
5.1166 0 Td
(cbi.1006116)Tj
0 g
6.3497 0 Td
(April)Tj
2.1756 0 Td
(19,)Tj
1.5874 0 Td
(2018)Tj
27.9002 0 Td
(3)Tj
0.7654 0 Td
(/)Tj
ET
endstream
endobj
50 0 obj
<>stream
endstream
endobj
51 0 obj
<>stream
endstream
endobj
52 0 obj
<>stream
BT
66.402 0 Td
(25)Tj
ET
Q
endstream
endobj
53 0 obj
<>/XObject<>>>/CropBox[0 0 612 792]/MediaBox[0 0 612 792]/Parent 12 0 R/Annots 63 0 R/Contents 64 0 R/TrimBox[0 0 612 792]>>
endobj
63 0 obj
[65 0 R 66 0 R 67 0 R 68 0 R]
endobj
65 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref014)>>
endobj
66 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref015)>>
endobj
67 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref016)>>
endobj
68 0 obj
<>/Border[0 0 0]/A 69 0 R>>
endobj
69 0 obj
<>
endobj
64 0 obj
[70 0 R 71 0 R 72 0 R 73 0 R 74 0 R 75 0 R]
endobj
70 0 obj
<>stream
q
0.83 0.64 0.02 0 k
343.2756 380.0126 m
352.8 380.0126 l
h
f*
357.222 380.0126 m
366.7465 380.0126 l
h
f*
203.4142 262.9984 m
212.9386 262.9984 l
h
f*
0 g
1 j
1 J
0 w
10 0 0 10 200.0125 706.2236 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(given)Tj
2.3754 0 Td
(a)Tj
0.6576 0 Td
(state)Tj
2.0353 0 Td
(tuple)Tj
/F10 1 Tf
2.2337 0 Td
[()]TJ
/F5 1 Tf
0.5499 0 Td
(=)Tj
/F11 1 Tf
0 Tc
0.7993 0 Td
(<)Tj
/F10 1 Tf
-0.004 Tc
0.9922 0 Td
[()]TJ
/F5 1 Tf
(,)Tj
/F10 1 Tf
0.907 0 Td
[()]TJ
/F11 1 Tf
0 Tc
0.5953 0 Td
(>)Tj
/F5 1 Tf
-0.004 Tc
0.9865 0 Td
(where)Tj
/F10 1 Tf
0 Tc
2.6532 0 Td
[()]TJ
/F12 1 Tf
0.7653 0 Td
(2)Tj
/F13 1 Tf
0.9354 0 Td
( 5)Tj
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 372.0755 710.6456 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 377.9716 706.2236 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(is)Tj
0.8447 0 Td
(a)Tj
0.6576 0 Td
(vector)Tj
2.6986 0 Td
(of)Tj
1.0148 0 Td
(state)Tj
2.0296 0 Td
(variables)Tj
3.719 0 Td
(\(for)Tj
1.7291 0 Td
(example,)Tj
3.7757 0 Td
(a)Tj
0.652 0 Td
(loca-)Tj
-34.9168 -1.3039 Td
(tion)Tj
1.8425 0 Td
(vector)Tj
2.6929 0 Td
(in)Tj
1.0374 0 Td
(coordinate)Tj
4.5298 0 Td
(space\))Tj
2.7155 0 Td
(and)Tj
/F10 1 Tf
0 Tc
1.7348 0 Td
[()]TJ
/F12 1 Tf
0.652 0 Td
(2)Tj
/F13 1 Tf
0.9354 0 Td
( 5)Tj
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 368.6173 697.6629 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 374.5133 693.1842 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(is)Tj
0.8447 0 Td
(a)Tj
0.6519 0 Td
(context)Tj
3.1862 0 Td
(vector.)Tj
2.9253 0 Td
(Here,)Tj
2.4321 0 Td
(we)Tj
1.3266 0 Td
(define)Tj
2.6986 0 Td
(context)Tj
3.9685 0 Td
(as)Tj
1.0147 0 Td
(a)Tj
-36.4985 -1.2982 Td
(vector)Tj
2.6985 0 Td
(denoting)Tj
3.8041 0 Td
(some)Tj
2.3301 0 Td
(mutable)Tj
3.4752 0 Td
(property)Tj
3.6851 0 Td
(of)Tj
1.0147 0 Td
(the)Tj
1.4683 0 Td
(world)Tj
2.5568 0 Td
(\(for)Tj
1.7235 0 Td
(example,)Tj
3.7757 0 Td
(the)Tj
1.4683 0 Td
(presence)Tj
3.7134 0 Td
(or)Tj
1.0998 0 Td
(absence)Tj
3.3392 0 Td
(of)Tj
-36.1527 -1.2983 Td
(rain,)Tj
2.0636 0 Td
(an)Tj
1.2019 0 Td
(episodic)Tj
3.5149 0 Td
(period)Tj
2.8346 0 Td
(of)Tj
1.0148 0 Td
(time,)Tj
2.2564 0 Td
(etc.\))Tj
1.9275 0 Td
(that)Tj
1.7802 0 Td
(constrain)Tj
3.9797 0 Td
(the)Tj
1.4683 0 Td
(statistics)Tj
3.5887 0 Td
(of)Tj
1.0148 0 Td
(the)Tj
1.4683 0 Td
(task)Tj
1.8142 0 Td
(domain,)Tj
3.5489 0 Td
(whereby)Tj
-33.4768 -1.2982 Td
(these)Tj
2.2507 0 Td
(task)Tj
1.8141 0 Td
(statistics)Tj
3.5887 0 Td
(are)Tj
1.4456 0 Td
(consistent)Tj
4.2576 0 Td
(for)Tj
1.389 0 Td
(each)Tj
2.0239 0 Td
(context)Tj
3.1861 0 Td
(that)Tj
1.7801 0 Td
(cues)Tj
1.9559 0 Td
(the)Tj
1.4683 0 Td
(relevant)Tj
3.4186 0 Td
(task.)Tj
2.0353 0 Td
(Formally,)Tj
4.0535 0 Td
(for)Tj
-34.6674 -1.304 Td
(each)Tj
2.0296 0 Td
(context)Tj
3.1804 0 Td
(we)Tj
1.3266 0 Td
(can)Tj
1.6271 0 Td
(define)Tj
2.6986 0 Td
(a)Tj
0.6576 0 Td
(Markov)Tj
3.3732 0 Td
(decision)Tj
3.5432 0 Td
(process)Tj
3.1861 0 Td
(\(MDP\))Tj
3.0898 0 Td
(with)Tj
1.9955 0 Td
(state)Tj
2.0353 0 Td
(variables)Tj
/F10 1 Tf
3.719 0 Td
[()]TJ
/F12 1 Tf
0 Tc
0.686 0 Td
(2)Tj
/F10 1 Tf
-0.004 Tc
0.8788 0 Td
[()]TJ
/F5 1 Tf
(,)Tj
-34.0268 -1.2982 Td
(actions)Tj
/F10 1 Tf
3.0557 0 Td
[( )]TJ
/F12 1 Tf
0 Tc
0.7087 0 Td
(2)Tj
/F10 1 Tf
-0.004 Tc
0.8787 0 Td
[()]TJ
/F5 1 Tf
(,)Tj
1.0942 0 Td
(a)Tj
0.6576 0 Td
(reward)Tj
3.0331 0 Td
(function)Tj
3.6283 0 Td
(mapping)Tj
3.787 0 Td
(state)Tj
2.0352 0 Td
(variables)Tj
3.719 0 Td
(and)Tj
1.7292 0 Td
(actions)Tj
3.0614 0 Td
(to)Tj
1.0261 0 Td
(a)Tj
0.652 0 Td
(real)Tj
1.6951 0 Td
(valued)Tj
2.8346 0 Td
(number)Tj
/F10 1 Tf
0 Tc
-33.5959 -1.2983 Td
[()]TJ
/F14 1 Tf
0.873 0 Td
(:)Tj
/F10 1 Tf
0.5443 0 Td
[()]TJ
/F12 1 Tf
0.9127 0 Td
()Tj
/F15 1 Tf
0.9922 0 Td
(A)Tj
/F12 1 Tf
1.0715 0 Td
(!)Tj
/F13 1 Tf
1.2755 0 Td
( 5)Tj
/F5 1 Tf
-0.004 Tc
(,)Tj
1.1679 0 Td
(and)Tj
1.7291 0 Td
(a)Tj
0.652 0 Td
(transition)Tj
4.1215 0 Td
(function)Tj
3.6284 0 Td
(mapping)Tj
3.7926 0 Td
(state)Tj
2.0353 0 Td
(variables)Tj
3.719 0 Td
(and)Tj
1.7291 0 Td
(actions)Tj
3.0557 0 Td
(to)Tj
1.0262 0 Td
(a)Tj
0.6576 0 Td
(probability)Tj
-32.9836 -1.3039 Td
(distribution)Tj
4.9662 0 Td
(over)Tj
1.9786 0 Td
(successors)Tj
/F10 1 Tf
0 Tc
4.337 0 Td
[()]TJ
/F14 1 Tf
0.9468 0 Td
(:)Tj
/F10 1 Tf
0.5499 0 Td
[()]TJ
/F12 1 Tf
0.9071 0 Td
()Tj
/F15 1 Tf
0.9921 0 Td
(A)Tj
/F12 1 Tf
1.0715 0 Td
(!)Tj
/F16 1 Tf
1.2756 0 Td
(P)Tj
/F12 1 Tf
()Tj
/F10 1 Tf
[()]TJ
/F12 1 Tf
1.8991 0 Td
()Tj
/F5 1 Tf
-0.004 Tc
(.)Tj
-17.7277 -1.2983 Td
(For)Tj
1.6271 0 Td
(the)Tj
1.4683 0 Td
(purpose)Tj
3.4469 0 Td
(of)Tj
1.0148 0 Td
(simplicity,)Tj
4.371 0 Td
(we)Tj
1.3266 0 Td
(assume)Tj
3.1464 0 Td
(that)Tj
1.7744 0 Td
(the)Tj
1.474 0 Td
(agent)Tj
2.3868 0 Td
(knows)Tj
2.8176 0 Td
(the)Tj
1.4683 0 Td
(spatial)Tj
2.778 0 Td
(relationship)Tj
-30.2964 -1.2982 Td
(between)Tj
3.5263 0 Td
(states)Tj
2.3981 0 Td
(\(i.e.,)Tj
1.9275 0 Td
(it)Tj
0.7824 0 Td
(has)Tj
1.542 0 Td
(access)Tj
2.6475 0 Td
(to)Tj
1.0262 0 Td
(a)Tj
0.6519 0 Td
(spatial)Tj
2.778 0 Td
(map)Tj
1.9898 0 Td
(of)Tj
1.0148 0 Td
(its)Tj
1.1508 0 Td
(current)Tj
3.1805 0 Td
(position)Tj
3.4979 0 Td
(and)Tj
1.7291 0 Td
(adjacent)Tj
3.566 0 Td
(positions\))Tj
-33.4088 -1.304 Td
(but)Tj
1.5534 0 Td
(has)Tj
1.542 0 Td
(to)Tj
1.0261 0 Td
(learn)Tj
2.2394 0 Td
(how)Tj
1.9389 0 Td
(its)Tj
1.1508 0 Td
(actions)Tj
3.0558 0 Td
(take)Tj
1.8708 0 Td
(it)Tj
0.788 0 Td
(from)Tj
2.2054 0 Td
(one)Tj
1.7007 0 Td
(state)Tj
2.0352 0 Td
(to)Tj
1.0262 0 Td
(another.)Tj
3.5546 0 Td
(Specifically,)Tj
4.9096 0 Td
(we)Tj
1.3266 0 Td
(assume)Tj
3.1464 0 Td
(the)Tj
-35.0699 -1.2982 Td
(agent)Tj
2.3867 0 Td
(knows)Tj
2.8177 0 Td
(a)Tj
0.6576 0 Td
(set)Tj
1.2983 0 Td
(of)Tj
/F10 1 Tf
1.0147 0 Td
[()7( )16()20()12()12()6( )11(\n)]TJ
3.4526 0 Td
[()6()12()3()2()6()2()22()]TJ
0 Tc
4.6148 0 Td
[()]TJ
/F12 1 Tf
0.9354 0 Td
(2)Tj
/F15 1 Tf
0.9354 0 Td
(A)Tj
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 389.0834 547.7102 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()7( )16()]TJ
1.2094 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 400.0251 550.2047 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(,)Tj
0.4422 0 Td
(where)Tj
2.6532 0 Td
(each)Tj
2.0296 0 Td
(cardinal)Tj
3.4695 0 Td
(movement)Tj
4.5184 0 Td
(is)Tj
0.8448 0 Td
(a)Tj
0.6519 0 Td
(vector)Tj
-34.6107 -1.3039 Td
(that)Tj
1.7745 0 Td
(defines)Tj
3.0614 0 Td
(a)Tj
0.652 0 Td
(change)Tj
3.0443 0 Td
(in)Tj
1.0375 0 Td
(the)Tj
1.4684 0 Td
(state)Tj
2.0352 0 Td
(variables)Tj
3.7191 0 Td
(with)Tj
1.9955 0 Td
(regard)Tj
2.8119 0 Td
(to)Tj
1.0261 0 Td
(the)Tj
1.4684 0 Td
(known)Tj
3.0047 0 Td
(spatial)Tj
2.7779 0 Td
(structure)Tj
3.8267 0 Td
(per)Tj
1.5307 0 Td
(unit)Tj
-35.2343 -1.3039 Td
(time.)Tj
2.2507 0 Td
(\(For)Tj
1.9672 0 Td
(example,)Tj
3.7758 0 Td
(in)Tj
1.0374 0 Td
(a)Tj
0.652 0 Td
(two)Tj
1.7121 0 Td
(dimensional)Tj
5.1704 0 Td
(grid)Tj
1.8482 0 Td
(world)Tj
2.5567 0 Td
(we)Tj
1.3266 0 Td
(can)Tj
1.6271 0 Td
(define)Tj
2.6985 0 Td
(North)Tj
2.6589 0 Td
(=)Tj
/F12 1 Tf
0 Tc
0.7994 0 Td
(h)Tj
/F10 1 Tf
-0.004 Tc
[()]TJ
/F5 1 Tf
(/)Tj
/F10 1 Tf
[()14()]TJ
/F5 1 Tf
(,)Tj
/F10 1 Tf
2.9197 0 Td
[()15()]TJ
/F5 1 Tf
(/)Tj
/F10 1 Tf
[()14()]TJ
/F12 1 Tf
0 Tc
(i)Tj
/F5 1 Tf
-0.004 Tc
2.6588 0 Td
(=)Tj
/F12 1 Tf
0 Tc
0.7994 0 Td
(h)Tj
/F5 1 Tf
-0.004 Tc
(0,)Tj
-36.4589 -1.2983 Td
(1)Tj
/F12 1 Tf
0 Tc
(i)Tj
/F5 1 Tf
-0.004 Tc
1.0828 0 Td
(as)Tj
1.0148 0 Td
(a)Tj
0.652 0 Td
(cardinal)Tj
3.4696 0 Td
(movement\).)Tj
5.0853 0 Td
(We)Tj
1.6044 0 Td
(can)Tj
1.6271 0 Td
(thus)Tj
1.9332 0 Td
(define)Tj
2.6986 0 Td
(a)Tj
0.6576 0 Td
(transition)Tj
4.1215 0 Td
(function)Tj
3.6283 0 Td
(in)Tj
1.0318 0 Td
(terms)Tj
2.4945 0 Td
(of)Tj
1.0147 0 Td
(cardinal)Tj
-32.1162 -1.2982 Td
(movements)Tj
/F10 1 Tf
4.8756 0 Td
[()]TJ
/F5 1 Tf
(\()Tj
/F10 1 Tf
[()]TJ
/F5 1 Tf
(,)Tj
/F10 1 Tf
1.8425 0 Td
[()]TJ
/F5 1 Tf
(,)Tj
/F10 1 Tf
1.0942 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 282.7842 501.7889 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(0)Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 284.9385 498.1606 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(|)Tj
/F10 1 Tf
[()]TJ
/F5 1 Tf
(\))Tj
1.1848 0 Td
(=)Tj
0.7994 0 Td
(Pr\()Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 322.1858 501.7889 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(0)Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 324.2834 498.1606 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(|)Tj
/F10 1 Tf
[()]TJ
/F5 1 Tf
(,)Tj
/F10 1 Tf
1.1678 0 Td
[()]TJ
/F5 1 Tf
(,)Tj
/F10 1 Tf
1.0999 0 Td
[()]TJ
/F5 1 Tf
(\))Tj
0.9297 0 Td
(and)Tj
1.7291 0 Td
(cast)Tj
1.7405 0 Td
(the)Tj
1.4683 0 Td
(navigation)Tj
4.4447 0 Td
(problem)Tj
3.6113 0 Td
(as)Tj
1.0148 0 Td
(the)Tj
1.4684 0 Td
(learning)Tj
3.5263 0 Td
(of)Tj
-34.6278 -1.3039 Td
(some)Tj
2.3301 0 Td
(function)Tj
3.6283 0 Td
(that)Tj
1.7802 0 Td
(maps)Tj
2.3527 0 Td
(primitive)Tj
3.906 0 Td
(actions)Tj
3.0558 0 Td
(to)Tj
1.0261 0 Td
(cardinal)Tj
3.4753 0 Td
(movements)Tj
/F11 1 Tf
0 Tc
4.8755 0 Td
()Tj
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 470.211 482.6267 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 475.7669 485.1212 cm
BT
/F14 1 Tf
1 TL
0 0 Td
(:)Tj
/F15 1 Tf
0.5499 0 Td
(A)Tj
/F12 1 Tf
1.0715 0 Td
(!)Tj
/F15 1 Tf
1.2755 0 Td
(A)Tj
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 512.674 482.6267 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()7( )16()]TJ
1.2094 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 523.6157 485.1212 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(,)Tj
0.4422 0 Td
(which)Tj
2.6532 0 Td
(we)Tj
-35.4555 -1.3039 Td
(assume)Tj
3.1465 0 Td
(to)Tj
1.0261 0 Td
(be)Tj
1.1509 0 Td
(independent)Tj
5.2724 0 Td
(of)Tj
1.0148 0 Td
(location.)Tj
-10.4144 -1.2982 Td
(This)Tj
1.9899 0 Td
(simplifying)Tj
4.7225 0 Td
(assumption)Tj
4.8585 0 Td
(has)Tj
1.542 0 Td
(the)Tj
1.474 0 Td
(benefit)Tj
2.9764 0 Td
(of)Tj
1.0148 0 Td
(providing)Tj
4.1442 0 Td
(a)Tj
0.652 0 Td
(model)Tj
2.7439 0 Td
(of)Tj
1.0148 0 Td
(human)Tj
3.0784 0 Td
(navigation,)Tj
-31.4077 -1.304 Td
(whom)Tj
2.7553 0 Td
(we)Tj
1.3323 0 Td
(assume)Tj
3.1464 0 Td
(understand)Tj
4.7849 0 Td
(spatial)Tj
2.7779 0 Td
(structure.)Tj
4.0478 0 Td
(Note)Tj
2.1884 0 Td
(that)Tj
1.7745 0 Td
(the)Tj
1.474 0 Td
(function)Tj
3.6283 0 Td
(mapping)Tj
3.787 0 Td
(motor)Tj
2.7212 0 Td
(actions)Tj
-34.418 -1.2982 Td
(onto)Tj
2.0807 0 Td
(cardinal)Tj
3.4695 0 Td
(movements)Tj
4.8756 0 Td
(can)Tj
1.6271 0 Td
(depend)Tj
3.1918 0 Td
(on)Tj
1.2755 0 Td
(environmental)Tj
6.1115 0 Td
(conditions,)Tj
4.6998 0 Td
(and)Tj
1.7291 0 Td
(thus,)Tj
2.16 0 Td
(context)Tj
3.1861 0 Td
(\(for)Tj
-34.4067 -1.2983 Td
(example,)Tj
3.7758 0 Td
(wind)Tj
2.245 0 Td
(condition)Tj
4.1159 0 Td
(can)Tj
1.627 0 Td
(change)Tj
3.0388 0 Td
(the)Tj
1.474 0 Td
(relationship)Tj
4.9889 0 Td
(between)Tj
3.5263 0 Td
(primitive)Tj
3.9061 0 Td
(actions)Tj
3.0614 0 Td
(and)Tj
1.729 0 Td
(move-)Tj
-33.4882 -1.2982 Td
(ments)Tj
2.6703 0 Td
(in)Tj
1.0374 0 Td
(space)Tj
2.3755 0 Td
(for)Tj
1.3889 0 Td
(an)Tj
1.2019 0 Td
(aerial)Tj
2.3981 0 Td
(drone\).)Tj
3.1634 0 Td
(A)Tj
0.9015 0 Td
(similar)Tj
2.9876 0 Td
(mapping)Tj
3.7871 0 Td
(between)Tj
3.532 0 Td
(arbitrary)Tj
3.7247 0 Td
(button)Tj
2.9083 0 Td
(presses)Tj
3.0386 0 Td
(and)Tj
-35.1153 -1.304 Td
(movements)Tj
4.8756 0 Td
(in)Tj
1.0375 0 Td
(the)Tj
1.4683 0 Td
(finger)Tj
2.9764 0 Td
(sailing)Tj
3.1974 0 Td
(task)Tj
1.8142 0 Td
(has)Tj
1.542 0 Td
(been)Tj
2.1203 0 Td
(used)Tj
2.058 0 Td
(to)Tj
1.0261 0 Td
(provided)Tj
3.8154 0 Td
(evidence)Tj
3.7134 0 Td
(for)Tj
1.3889 0 Td
(model-based)Tj
-31.0335 -1.2982 Td
(action)Tj
2.6986 0 Td
(planning)Tj
3.7927 0 Td
(in)Tj
1.0375 0 Td
(human)Tj
3.0784 0 Td
(subjects)Tj
3.3789 0 Td
([)Tj
0.83 0.64 0.02 0 k
(14)Tj
0 g
(,)Tj
0.83 0.64 0.02 0 k
1.7348 0 Td
(15)Tj
0 g
(].)Tj
1.7348 0 Td
(Similarly,)Tj
4.0308 0 Td
(we)Tj
1.3266 0 Td
(can)Tj
1.6271 0 Td
(express)Tj
3.1408 0 Td
(the)Tj
1.4683 0 Td
(reward)Tj
3.0331 0 Td
(function)Tj
3.6282 0 Td
(in)Tj
-35.7106 -1.2983 Td
(terms)Tj
2.4945 0 Td
(of)Tj
1.0148 0 Td
(cardinal)Tj
3.4696 0 Td
(movements)Tj
4.8756 0 Td
(based)Tj
2.4717 0 Td
(on)Tj
1.2756 0 Td
(a)Tj
0.6577 0 Td
(location)Tj
3.4525 0 Td
(in)Tj
1.0318 0 Td
(space,)Tj
/F10 1 Tf
2.6079 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 439.4267 366.4062 cm
BT
/F10 1 Tf
1 TL
-0.0053 Tc
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 442.2047 368.107 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(\()Tj
/F10 1 Tf
[()]TJ
/F5 1 Tf
(,)Tj
/F10 1 Tf
1.2472 0 Td
[()]TJ
/F5 1 Tf
(\))Tj
1.2132 0 Td
(=)Tj
0.7994 0 Td
(Pr\()Tj
/F10 1 Tf
[()]TJ
/F5 1 Tf
(|)Tj
/F10 1 Tf
[()]TJ
/F5 1 Tf
(,)Tj
/F10 1 Tf
2.8006 0 Td
[()]TJ
/F5 1 Tf
(,)Tj
/F10 1 Tf
1.0998 0 Td
[()]TJ
/F5 1 Tf
(\).)Tj
1.1565 0 Td
(This)Tj
1.9843 0 Td
(allows)Tj
-34.52 -1.3039 Td
(us)Tj
1.1055 0 Td
(to)Tj
1.0205 0 Td
(consider)Tj
3.651 0 Td
(how)Tj
1.9332 0 Td
(the)Tj
1.4683 0 Td
(agent)Tj
2.3868 0 Td
(receives)Tj
3.3618 0 Td
(reward)Tj
3.0331 0 Td
(as)Tj
1.0091 0 Td
(it)Tj
0.7824 0 Td
(moves)Tj
2.7836 0 Td
(through)Tj
3.4468 0 Td
(coordinate)Tj
4.5241 0 Td
(space)Tj
2.3754 0 Td
(\(as)Tj
1.3549 0 Td
(opposed)Tj
-34.2365 -1.2982 Td
(to)Tj
1.0261 0 Td
(how)Tj
1.9389 0 Td
(it)Tj
0.7824 0 Td
(receives)Tj
3.3675 0 Td
(reward)Tj
3.0331 0 Td
(as)Tj
1.0148 0 Td
(a)Tj
0.6519 0 Td
(function)Tj
3.6283 0 Td
(of)Tj
1.0205 0 Td
(its)Tj
1.1452 0 Td
(actions\).)Tj
3.6227 0 Td
(Alternatively,)Tj
5.5954 0 Td
(we)Tj
1.3266 0 Td
(can)Tj
1.6271 0 Td
(express)Tj
3.1464 0 Td
(the)Tj
1.4684 0 Td
(reward)Tj
-34.3953 -1.2983 Td
(function)Tj
3.6283 0 Td
(as)Tj
/F10 1 Tf
1.0148 0 Td
[()]TJ
/F5 1 Tf
(\()Tj
/F10 1 Tf
[()]TJ
/F5 1 Tf
(,)Tj
/F10 1 Tf
1.8425 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
6.9998 0 0 6.9998 269.5181 332.7307 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(0)Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 271.8992 329.1023 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(\))Tj
0.5612 0 Td
(or)Tj
1.0942 0 Td
(more)Tj
2.3414 0 Td
(simply)Tj
2.8856 0 Td
(as)Tj
/F10 1 Tf
1.0148 0 Td
[()]TJ
/F5 1 Tf
(\()Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
6.9998 0 0 6.9998 364.8755 332.7307 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(0)Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 367.2566 329.1023 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(\).)Tj
0.7823 0 Td
(The)Tj
1.7858 0 Td
(key)Tj
1.5931 0 Td
(assumption)Tj
4.8642 0 Td
(here)Tj
1.9616 0 Td
(is)Tj
0.8504 0 Td
(that)Tj
1.7801 0 Td
(the)Tj
1.4683 0 Td
(reward)Tj
3.0331 0 Td
(func-)Tj
-34.8432 -1.3039 Td
(tion)Tj
1.8426 0 Td
(is)Tj
0.8447 0 Td
(not)Tj
1.576 0 Td
(a)Tj
0.652 0 Td
(function)Tj
3.6283 0 Td
(of)Tj
1.0148 0 Td
(the)Tj
1.4683 0 Td
(agent's)Tj
2.9651 0 Td
(actions)Tj
3.0613 0 Td
(but)Tj
1.5533 0 Td
(is)Tj
0.8504 0 Td
(a)Tj
0.652 0 Td
(function)Tj
3.6283 0 Td
(of)Tj
1.0148 0 Td
(the)Tj
1.4684 0 Td
(consequences)Tj
5.6976 0 Td
(of)Tj
1.0148 0 Td
(those)Tj
-32.9327 -1.2982 Td
(actions.)Tj
1.1963 -1.2983 Td
(The)Tj
1.7858 0 Td
(task)Tj
1.8085 0 Td
(of)Tj
1.0148 0 Td
(the)Tj
1.4683 0 Td
(agent)Tj
2.3924 0 Td
(is)Tj
0.8447 0 Td
(to)Tj
1.0262 0 Td
(generate)Tj
3.6113 0 Td
(a)Tj
0.652 0 Td
(policy)Tj
2.6361 0 Td
(\(a)Tj
0.9921 0 Td
(function)Tj
3.6283 0 Td
(mapping)Tj
3.7927 0 Td
(state)Tj
2.0353 0 Td
(variables)Tj
3.719 0 Td
(to)Tj
1.0205 0 Td
(primitive)Tj
-33.6243 -1.3039 Td
(actions,)Tj
3.2825 0 Td
(for)Tj
1.389 0 Td
(each)Tj
2.0296 0 Td
(context;)Tj
/F17 1 Tf
0 Tc
3.4072 0 Td
(p)Tj
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 306.5952 280.7433 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 310.1102 277.0582 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(j)Tj
/F10 1 Tf
[()]TJ
/F14 1 Tf
0.924 0 Td
(:)Tj
/F10 1 Tf
0.55 0 Td
[()]TJ
/F12 1 Tf
0.9637 0 Td
(!)Tj
/F15 1 Tf
1.2813 0 Td
(A)Tj
/F5 1 Tf
-0.004 Tc
(\))Tj
1.3493 0 Td
(that)Tj
1.7801 0 Td
(maximizes)Tj
4.4901 0 Td
(its)Tj
1.1452 0 Td
(expected)Tj
3.7247 0 Td
(future)Tj
2.6532 0 Td
(discounted)Tj
4.6317 0 Td
(reward)Tj
-34.5029 -1.2982 Td
([)Tj
0.83 0.64 0.02 0 k
(16)Tj
0 g
(].)Tj
2.0749 0 Td
(Given)Tj
2.6305 0 Td
(a)Tj
0.652 0 Td
(known)Tj
3.0047 0 Td
(transition)Tj
4.1215 0 Td
(function)Tj
3.6283 0 Td
(and)Tj
1.7291 0 Td
(reward)Tj
3.0331 0 Td
(function,)Tj
3.855 0 Td
(the)Tj
1.4684 0 Td
(optimal)Tj
3.3108 0 Td
(policy)Tj
2.6362 0 Td
(given)Tj
2.3811 0 Td
(this)Tj
-34.5256 -1.2983 Td
(task)Tj
1.8084 0 Td
(can)Tj
1.6271 0 Td
(be)Tj
1.1509 0 Td
(defined)Tj
3.2258 0 Td
(as:)Tj
/F17 1 Tf
0 Tc
-2.8516 -3.3902 Td
(p)Tj
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 255.1748 220.8188 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F10 1 Tf
0 -1.0677 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 258.633 217.1905 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F10 1 Tf
[()]TJ
/F12 1 Tf
0.8787 0 Td
()Tj
0.6576 0 Td
()Tj
/F18 1 Tf
1.0488 0 Td
[()8()8()]TJ
1.5874 0 Td
[()3()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 307.4456 211.1244 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[( )]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 326.948 226.6582 cm
BT
/F19 1 Tf
1 TL
0 0 Td
(X)Tj
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 323.2062 206.759 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
/F12 1 Tf
(2)Tj
/F15 1 Tf
(A)Tj
ET
Q
q
1 j
1 J
0 w
5 0 0 5 335.8488 205.2283 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()7( )16()20()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 345.033 217.1905 cm
BT
/F11 1 Tf
1 TL
0 0 Td
()Tj
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 350.9858 214.696 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 353.7637 217.1905 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F10 1 Tf
[( )]TJ
/F11 1 Tf
(;)Tj
/F10 1 Tf
1.3095 0 Td
[()]TJ
/F12 1 Tf
()Tj
/F19 1 Tf
1.2133 0.9467 Td
(X)Tj
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 379.7291 206.5889 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
5 0 0 5 382.6771 208.2897 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(0)Tj
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 384.4913 206.5889 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(2)Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 394.9795 217.1905 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 400.9322 214.696 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 403.6535 217.1905 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F10 1 Tf
[()]TJ
/F11 1 Tf
0.8787 0 Td
(;)Tj
/F10 1 Tf
0.4365 0 Td
[()]TJ
/F11 1 Tf
(;)Tj
/F10 1 Tf
1.0942 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 432.6236 221.3291 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(0)Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 434.7779 217.1905 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 447.2503 214.696 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 450.0283 217.1905 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 458.759 221.3291 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(0)Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 460.9133 217.1905 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
0.6009 0 Td
()Tj
/F17 1 Tf
0.9978 0 Td
(g)Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 487.9559 214.696 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 490.6771 217.1905 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 499.4078 221.3291 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(0)Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 501.5622 217.1905 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F19 1 Tf
-18.408 1.7121 Td
(")Tj
19.0656 0 Td
(#)Tj
/F12 1 Tf
5.5332 -1.7404 Td
()Tj
/F5 1 Tf
(1)Tj
/F12 1 Tf
()Tj
/F5 1 Tf
-0.004 Tc
-36.3455 -3.7134 Td
(where)Tj
/F10 1 Tf
2.6475 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 233.1212 178.0724 cm
BT
/F10 1 Tf
1 TL
-0.0053 Tc
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 235.8992 179.7732 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(\()Tj
/F10 1 Tf
[()]TJ
/F5 1 Tf
(\))Tj
1.3662 0 Td
(is)Tj
0.8504 0 Td
(the)Tj
1.4684 0 Td
(optimal)Tj
3.3108 0 Td
(value)Tj
2.3017 0 Td
(function)Tj
3.6284 0 Td
(is)Tj
0.8503 0 Td
(defined)Tj
3.2258 0 Td
(by)Tj
1.1849 0 Td
(the)Tj
1.4684 0 Td
(Bellman)Tj
3.5149 0 Td
(equation:)Tj
/F10 1 Tf
0 Tc
-20.0238 -3.3902 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 274.0535 143.3763 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 276.8314 145.8708 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F10 1 Tf
[()]TJ
/F12 1 Tf
0.873 0 Td
()Tj
0.6576 0 Td
()Tj
/F18 1 Tf
1.0489 0 Td
[()3()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 309.2598 139.748 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 325.5307 155.3385 cm
BT
/F19 1 Tf
1 TL
0 0 Td
(X)Tj
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 326.2677 135.2692 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
5 0 0 5 329.2157 136.97 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(0)Tj
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 331.0299 135.2692 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(2)Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 339.874 145.8708 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 345.8267 143.3763 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 348.548 145.8708 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F10 1 Tf
[()]TJ
/F11 1 Tf
0.873 0 Td
(;)Tj
/F10 1 Tf
0.4422 0 Td
[()]TJ
/F11 1 Tf
(;)Tj
/F10 1 Tf
1.0942 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 377.5181 150.0094 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(0)Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 379.6157 145.8708 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 392.1448 143.3763 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 394.9228 145.8708 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 403.6535 150.0094 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(0)Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 405.7511 145.8708 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
0.6066 0 Td
()Tj
/F17 1 Tf
0.9921 0 Td
(g)Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 432.7937 143.3763 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 435.5716 145.8708 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 444.3023 150.0094 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(0)Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 446.4 145.8708 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F19 1 Tf
-12.6651 1.7121 Td
(")Tj
13.3227 0 Td
(#)Tj
/F12 1 Tf
0.9751 -1.7121 Td
(8)Tj
/F10 1 Tf
0.9468 0 Td
[()]TJ
/F12 1 Tf
0.771 0 Td
(2)Tj
/F10 1 Tf
0.9354 0 Td
[()]TJ
/F12 1 Tf
7.4211 0 Td
()Tj
/F5 1 Tf
(2)Tj
/F12 1 Tf
()Tj
/F5 1 Tf
-0.004 Tc
-36.3455 -3.685 Td
(As)Tj
1.2642 0 Td
(the)Tj
1.4683 0 Td
(relationship)Tj
4.989 0 Td
(between)Tj
3.5319 0 Td
(locations)Tj
3.8098 0 Td
(in)Tj
1.0375 0 Td
(space,)Tj
/F10 1 Tf
2.6021 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 392.9385 107.3196 cm
BT
/F10 1 Tf
1 TL
-0.0053 Tc
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 395.7165 109.0204 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(,)Tj
0.4478 0 Td
(is)Tj
0.8447 0 Td
(known)Tj
3.0047 0 Td
(to)Tj
1.0262 0 Td
(the)Tj
1.4683 0 Td
(agent,)Tj
2.6192 0 Td
(it)Tj
0.7824 0 Td
(is)Tj
0.8504 0 Td
(sufficient)Tj
3.9117 0 Td
(to)Tj
1.0262 0 Td
(learn)Tj
-35.5518 -1.3039 Td
(the)Tj
1.4683 0 Td
(cardinal)Tj
/F10 1 Tf
3.4696 0 Td
[()6( )12()11()11()12()13()]TJ
3.6453 0 Td
[()-8(\r)12()6()-4()7()4()11()]TJ
3.4753 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 326.0409 94.337 cm
BT
/F10 1 Tf
1 TL
-0.0053 Tc
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 328.8188 95.9811 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(\()Tj
/F10 1 Tf
[( )]TJ
/F5 1 Tf
(,)Tj
/F10 1 Tf
1.2755 0 Td
[()]TJ
/F5 1 Tf
(\))Tj
1.2133 0 Td
(and)Tj
/F10 1 Tf
1.7291 0 Td
[()20()-5()3( )16()20()]TJ
2.9763 0 Td
[()-8(\r)12()6()-4()7()4()11()]TJ
3.4753 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 441.411 94.337 cm
BT
/F10 1 Tf
1 TL
-0.0053 Tc
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 444.1889 95.9811 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(\()Tj
/F10 1 Tf
[()]TJ
/F5 1 Tf
(,)Tj
/F10 1 Tf
1.2529 0 Td
[()]TJ
/F5 1 Tf
(\))Tj
1.2075 0 Td
(to)Tj
1.0261 0 Td
(determine)Tj
4.3257 0 Td
(an)Tj
1.2019 0 Td
(optimal)Tj
-33.4315 -1.2982 Td
(policy.)Tj
ET
Q
q
1 j
1 J
0 w
576 737.1 m
36 737.1 l
36 737.6 l
576 737.6 l
f*
36 741.2598 169.285 23.6976 re
W* n
q
169.2283 0 0 23.6409 36 741.3165 cm
q
/I0 Do
Q
Q
Q
q
0 0 612 792 re
W* n
1 j
1 J
0 w
7.9999 0 0 7.9999 404.844 745.7952 cm
BT
/F0 1 Tf
1 TL
-0.005 Tc
0 0 Td
(Composit)Tj
4.1527 0 Td
(ional)Tj
2.289 0 Td
(clustering)Tj
4.415 0 Td
(in)Tj
0.978 0 Td
(task)Tj
2.0268 0 Td
(structure)Tj
4.0465 0 Td
(learning)Tj
ET
Q
q
1 j
1 J
0 w
36 48.0002 m
576 48.0002 l
576 47.5002 l
36 47.5002 l
f*
0.83 0.64 0.02 0 k
142.5827 34.9228 m
295.8236 34.9228 l
h
f*
0 g
7.9999 0 0 7.9999 36 36 cm
BT
/F0 1 Tf
1 TL
-0.005 Tc
0 0 Td
(PLOS)Tj
2.8559 0 Td
(Computationa)Tj
6.1229 0 Td
(l)Tj
0.4322 0 Td
(Biology)Tj
3.4371 0 Td
(|)Tj
0.83 0.64 0.02 0 k
0.4748 0 Td
(https:/)Tj
2.6788 0 Td
(/doi.org/10.13)Tj
6.0094 0 Td
(71/journal.p)Tj
5.1166 0 Td
(cbi.1006116)Tj
0 g
6.3497 0 Td
(April)Tj
2.1756 0 Td
(19,)Tj
1.5874 0 Td
(2018)Tj
27.9002 0 Td
(4)Tj
0.7654 0 Td
(/)Tj
ET
endstream
endobj
71 0 obj
<>stream
endstream
endobj
72 0 obj
<>stream
endstream
endobj
73 0 obj
<>stream
endstream
endobj
74 0 obj
<>stream
endstream
endobj
75 0 obj
<>stream
BT
66.402 0 Td
(25)Tj
ET
Q
endstream
endobj
76 0 obj
<>/XObject<>>>/CropBox[0 0 612 792]/MediaBox[0 0 612 792]/Parent 12 0 R/Annots 79 0 R/Contents 80 0 R/TrimBox[0 0 612 792]>>
endobj
79 0 obj
[81 0 R 82 0 R 83 0 R 84 0 R 85 0 R 86 0 R 87 0 R 88 0 R 89 0 R]
endobj
81 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref007)>>
endobj
82 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref002)>>
endobj
83 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref003)>>
endobj
84 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref004)>>
endobj
85 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref017)>>
endobj
86 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref018)>>
endobj
87 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref004)>>
endobj
88 0 obj
<>/Border[0 0 0]/Dest(Rpcbi.1006116.ref019)>>
endobj
89 0 obj
<>/Border[0 0 0]/A 90 0 R>>
endobj
90 0 obj
<>
endobj
80 0 obj
[91 0 R 92 0 R 93 0 R 94 0 R 95 0 R 96 0 R 97 0 R 98 0 R 99 0 R 100 0 R 101 0 R 102 0 R]
endobj
91 0 obj
<>stream
q
0.83 0.64 0.02 0 k
532.8 511.3701 m
537.5055 511.3701 l
h
f*
461.7071 498.3874 m
466.4693 498.3874 l
h
f*
289.1339 485.348 m
293.8394 485.348 l
h
f*
298.3181 485.348 m
303.0803 485.348 l
h
f*
402.8598 485.348 m
412.3843 485.348 l
h
f*
416.8063 485.348 m
426.3307 485.348 l
h
f*
393.6189 420.378 m
398.3811 420.378 l
h
f*
393.8457 407.3386 m
403.3701 407.3386 l
h
f*
0 g
1 j
1 J
0 w
10 0 0 10 211.9748 707.4141 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(While)Tj
2.6532 0 Td
(the)Tj
1.4683 0 Td
(optimal)Tj
3.3108 0 Td
(policy)Tj
2.6362 0 Td
(is)Tj
0.8448 0 Td
(dependent)Tj
4.4617 0 Td
(on)Tj
1.2756 0 Td
(both)Tj
2.0579 0 Td
(the)Tj
1.4683 0 Td
(mapping)Tj
3.7928 0 Td
(function)Tj
3.6283 0 Td
(and)Tj
1.7291 0 Td
(reward)Tj
3.0331 0 Td
(function,)Tj
-33.5563 -1.3039 Td
(crucially,)Tj
3.838 0 Td
(the)Tj
1.4684 0 Td
(optimal)Tj
3.3108 0 Td
(value)Tj
2.3074 0 Td
(function)Tj
3.6283 0 Td
(is)Tj
0.8447 0 Td
(not:)Tj
1.8029 0 Td
(it)Tj
0.7823 0 Td
(is)Tj
0.8504 0 Td
(dependent)Tj
4.456 0 Td
(only)Tj
1.9786 0 Td
(on)Tj
1.2756 0 Td
(the)Tj
1.4683 0 Td
(reward)Tj
3.0331 0 Td
(function)Tj
3.6283 0 Td
(\(and)Tj
-34.6731 -1.2982 Td
(the)Tj
1.4683 0 Td
(known)Tj
3.0047 0 Td
(transition)Tj
4.1215 0 Td
(function)Tj
/F10 1 Tf
3.6284 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 328.1385 679.748 cm
BT
/F10 1 Tf
1 TL
-0.0053 Tc
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 330.9165 681.3921 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(\).)Tj
0.788 0 Td
(Consequently,)Tj
5.9527 0 Td
(an)Tj
1.2019 0 Td
(agent)Tj
2.3924 0 Td
(can)Tj
1.6214 0 Td
(determine)Tj
4.3257 0 Td
(an)Tj
1.2018 0 Td
(optimal)Tj
3.3109 0 Td
(policy)Tj
2.6362 0 Td
(as)Tj
-36.5213 -1.2982 Td
(a)Tj
0.652 0 Td
(function)Tj
3.6283 0 Td
(of)Tj
1.0148 0 Td
(movements)Tj
4.8756 0 Td
(through)Tj
3.4468 0 Td
(space:)Tj
/F17 1 Tf
0 Tc
-5.6465 -2.846 Td
(p)Tj
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 285.222 643.5779 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F10 1 Tf
0 -1.0677 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 288.737 639.9496 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F10 1 Tf
[()]TJ
/F12 1 Tf
0.873 0 Td
()Tj
0.6633 0 Td
()Tj
/F18 1 Tf
1.0488 0 Td
[()8()8()]TJ
1.5874 0 Td
[()3()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 337.0393 633.8834 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 353.3102 649.4173 cm
BT
/F19 1 Tf
1 TL
0 0 Td
(X)Tj
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 354.0472 629.348 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
5 0 0 5 356.9952 631.0488 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(0)Tj
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 358.8661 629.348 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(2)Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 367.6535 639.9496 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 373.6062 637.4551 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 376.3275 639.9496 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F10 1 Tf
[()]TJ
/F11 1 Tf
0.8787 0 Td
(;)Tj
/F10 1 Tf
0.4365 0 Td
[()]TJ
/F11 1 Tf
(;)Tj
/F10 1 Tf
1.0942 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 405.2976 644.0881 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(0)Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 407.4519 639.9496 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F10 1 Tf
[()]TJ
/F12 1 Tf
()Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 428.7118 644.0881 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(0)Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 430.8094 639.9496 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
0.6066 0 Td
()Tj
/F17 1 Tf
0.9921 0 Td
(g)Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 457.8519 637.4551 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 460.5732 639.9496 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 469.3606 644.0881 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(0)Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 471.4582 639.9496 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F19 1 Tf
-12.3873 1.7121 Td
(")Tj
13.0449 0 Td
(#)Tj
/F12 1 Tf
8.5436 -1.7121 Td
()Tj
/F5 1 Tf
(3)Tj
/F12 1 Tf
()Tj
/F5 1 Tf
-0.004 Tc
-36.3455 -3.1407 Td
(This)Tj
1.9842 0 Td
(allows)Tj
2.6986 0 Td
(the)Tj
1.4683 0 Td
(agent)Tj
2.3924 0 Td
(to)Tj
1.0262 0 Td
(learn)Tj
2.245 0 Td
(how)Tj
1.9389 0 Td
(it)Tj
0.7823 0 Td
(can)Tj
1.6271 0 Td
(take)Tj
1.8709 0 Td
(an)Tj
1.2018 0 Td
(action)Tj
2.6986 0 Td
(to)Tj
1.0261 0 Td
(move)Tj
2.4265 0 Td
(through)Tj
3.4411 0 Td
(spacethe)Tj
4.5581 0 Td
(mapping)Tj
-33.3861 -1.2983 Td
(function)Tj
/F10 1 Tf
3.6283 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 241.7952 593.8582 cm
BT
/F10 1 Tf
1 TL
-0.0053 Tc
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 244.5732 595.559 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(\()Tj
/F10 1 Tf
[( )]TJ
/F5 1 Tf
(,)Tj
/F10 1 Tf
1.2699 0 Td
[()]TJ
/F5 1 Tf
(\)independently)Tj
7.8916 0 Td
(from)Tj
2.2053 0 Td
(the)Tj
1.4683 0 Td
(desirability)Tj
4.6488 0 Td
(of)Tj
1.0148 0 Td
(the)Tj
1.4684 0 Td
(consequences)Tj
5.6976 0 Td
(of)Tj
1.0148 0 Td
(these)Tj
2.2563 0 Td
(moves)Tj
/F10 1 Tf
-33.3918 -1.3039 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 205.9086 580.8755 cm
BT
/F10 1 Tf
1 TL
-0.0053 Tc
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 208.6866 582.5196 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(\()Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 216.737 586.148 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(0)Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 218.8346 582.5196 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(\).)Tj
0.788 0 Td
(This)Tj
1.9842 0 Td
(distinction)Tj
4.5354 0 Td
(allows)Tj
2.6986 0 Td
(for)Tj
1.389 0 Td
(compositionality)Tj
6.9391 0 Td
(during)Tj
2.931 0 Td
(generalization,)Tj
6.0945 0 Td
(as)Tj
1.0148 0 Td
(we)Tj
1.3266 0 Td
(will)Tj
1.6611 0 Td
(discuss)Tj
3.05 0 Td
(in)Tj
-36.2944 -1.2982 Td
(the)Tj
1.4683 0 Td
(following)Tj
3.9797 0 Td
(section.)Tj
ET
Q
q
1 j
1 J
0 w
11.9999 0 0 11.9999 200.0125 542.4377 cm
BT
/F20 1 Tf
1 TL
-0.0033 Tc
0 0 Td
(Context)Tj
3.5575 0 Td
(clustering)Tj
4.3606 0 Td
(as)Tj
1.0677 0 Td
(generalization)Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 200.0125 525.4299 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(A)Tj
0.9014 0 Td
(common)Tj
3.8494 0 Td
(strategy)Tj
3.3222 0 Td
(to)Tj
1.0261 0 Td
(support)Tj
3.3222 0 Td
(task)Tj
1.8085 0 Td
(generalization)Tj
5.8677 0 Td
(is)Tj
0.8447 0 Td
(to)Tj
1.0261 0 Td
(cluster)Tj
2.8743 0 Td
(contexts)Tj
3.5433 0 Td
(together,)Tj
3.7587 0 Td
(assuming)Tj
-32.1446 -1.2982 Td
(they)Tj
1.9218 0 Td
(share)Tj
2.3414 0 Td
(the)Tj
1.4684 0 Td
(same)Tj
2.2563 0 Td
(task)Tj
1.8085 0 Td
(statistics,)Tj
3.8154 0 Td
(if)Tj
0.7767 0 Td
(doing)Tj
2.5342 0 Td
(so)Tj
1.0885 0 Td
(leads)Tj
2.211 0 Td
(to)Tj
1.0261 0 Td
(an)Tj
1.2019 0 Td
(acceptable)Tj
4.354 0 Td
(degree)Tj
2.8516 0 Td
(of)Tj
1.0148 0 Td
(error)Tj
2.2677 0 Td
([)Tj
0.83 0.64 0.02 0 k
(7)Tj
0 g
(].)Tj
1.5988 0 Td
(This)Tj
-34.5371 -1.2983 Td
(logic)Tj
2.1259 0 Td
(underlies)Tj
3.9175 0 Td
(models)Tj
3.1067 0 Td
(of)Tj
1.0148 0 Td
(animal)Tj
2.9707 0 Td
(Pavlovian)Tj
4.1216 0 Td
(learning)Tj
3.5262 0 Td
(and)Tj
1.7292 0 Td
(transfer)Tj
3.3165 0 Td
([)Tj
0.83 0.64 0.02 0 k
(2)Tj
0 g
(],)Tj
1.6044 0 Td
(human)Tj
3.0727 0 Td
(instrumental)Tj
-30.5062 -1.3039 Td
(learning)Tj
3.5206 0 Td
(and)Tj
1.7347 0 Td
(transfer)Tj
3.3166 0 Td
([)Tj
0.83 0.64 0.02 0 k
(3)Tj
0 g
(,)Tj
0.83 0.64 0.02 0 k
1.2585 0 Td
(4)Tj
0 g
(],)Tj
1.2586 0 Td
(and)Tj
1.7348 0 Td
(category)Tj
3.5943 0 Td
(learning)Tj
3.5263 0 Td
([)Tj
0.83 0.64 0.02 0 k
(17)Tj
0 g
(,)Tj
0.83 0.64 0.02 0 k
1.7348 0 Td
(18)Tj
0 g
(].)Tj
1.7404 0 Td
(Clustering)Tj
4.388 0 Td
(models)Tj
3.1068 0 Td
(of)Tj
1.0148 0 Td
(human)Tj
3.0784 0 Td
(gener-)Tj
-35.0076 -1.2983 Td
(alization)Tj
3.6339 0 Td
(typically)Tj
3.5603 0 Td
(rely)Tj
1.7178 0 Td
(on)Tj
1.2756 0 Td
(a)Tj
0.652 0 Td
(non-parametric)Tj
6.5366 0 Td
(Dirichlet)Tj
3.7814 0 Td
(process,)Tj
3.4072 0 Td
(commonly)Tj
4.5468 0 Td
(known)Tj
3.0047 0 Td
(as)Tj
1.0148 0 Td
(the)Tj
1.474 0 Td
(Chi-)Tj
-34.6051 -1.2982 Td
(nese)Tj
1.9729 0 Td
(restaurant)Tj
4.2916 0 Td
(process)Tj
3.1804 0 Td
(\(CRP\),)Tj
2.9707 0 Td
(which)Tj
2.6532 0 Td
(acts)Tj
1.7348 0 Td
(as)Tj
1.0148 0 Td
(a)Tj
0.652 0 Td
(clustering)Tj
4.1555 0 Td
(prior)Tj
2.2507 0 Td
(in)Tj
1.0375 0 Td
(a)Tj
0.6577 0 Td
(Bayesian)Tj
3.719 0 Td
(inference)Tj
3.9401 0 Td
(process.)Tj
-34.2309 -1.3039 Td
(Used)Tj
2.2677 0 Td
(in)Tj
1.0374 0 Td
(this)Tj
1.6725 0 Td
(way,)Tj
2.0182 0 Td
(the)Tj
1.4683 0 Td
(CRP)Tj
2.0637 0 Td
(enforces)Tj
3.5659 0 Td
(popularity-based)Tj
6.9675 0 Td
(clustering)Tj
4.1499 0 Td
(to)Tj
1.0262 0 Td
(partition)Tj
3.7303 0 Td
(observations,)Tj
5.4822 0 Td
(so)Tj
-35.4498 -1.2983 Td
(that)Tj
1.7744 0 Td
(the)Tj
1.474 0 Td
(agent)Tj
2.3868 0 Td
(will)Tj
1.6668 0 Td
(be)Tj
1.1508 0 Td
(most)Tj
2.2054 0 Td
(likely)Tj
2.3527 0 Td
(to)Tj
1.0261 0 Td
(reuse)Tj
2.3244 0 Td
(those)Tj
2.3414 0 Td
(tasks)Tj
2.1657 0 Td
(that)Tj
1.7801 0 Td
(have)Tj
2.058 0 Td
(been)Tj
2.1259 0 Td
(most)Tj
2.2054 0 Td
(popular)Tj
3.3392 0 Td
(across)Tj
2.6815 0 Td
(dispa-)Tj
-35.0586 -1.2983 Td
(rate)Tj
1.7461 0 Td
(contexts)Tj
3.5433 0 Td
(\(as)Tj
1.3549 0 Td
(opposed)Tj
3.583 0 Td
(to)Tj
1.0261 0 Td
(across)Tj
2.6759 0 Td
(experiences;)Tj
5.091 0 Td
([)Tj
0.83 0.64 0.02 0 k
(4)Tj
0 g
(]\),)Tj
1.9446 0 Td
(and)Tj
1.7291 0 Td
(has)Tj
1.542 0 Td
(the)Tj
1.4684 0 Td
(attractive)Tj
3.9231 0 Td
(property)Tj
3.685 0 Td
(of)Tj
1.0148 0 Td
(being)Tj
2.4321 0 Td
(a)Tj
-36.7594 -1.3039 Td
(non-parametric)Tj
6.5309 0 Td
(model)Tj
2.744 0 Td
(that)Tj
1.7801 0 Td
(grows)Tj
2.6079 0 Td
(with)Tj
2.0012 0 Td
(the)Tj
1.4683 0 Td
(data)Tj
1.9106 0 Td
([)Tj
0.83 0.64 0.02 0 k
(19)Tj
0 g
(].)Tj
2.0806 0 Td
(Consequently,)Tj
5.9527 0 Td
(it)Tj
0.788 0 Td
(is)Tj
0.8448 0 Td
(not)Tj
1.576 0 Td
(necessary)Tj
4.0195 0 Td
(to)Tj
1.0262 0 Td
(know)Tj
-35.3308 -1.2983 Td
(the)Tj
1.4683 0 Td
(number)Tj
3.4185 0 Td
(of)Tj
1.0148 0 Td
(partitions)Tj
/F10 1 Tf
4.0876 0 Td
[( )]TJ
0.7086 0 Td
[()11()-9()4()11()-9()]TJ
/F5 1 Tf
2.4151 0 Td
(and)Tj
1.7292 0 Td
(the)Tj
1.474 0 Td
(CRP)Tj
2.0636 0 Td
(will)Tj
1.6611 0 Td
(tend)Tj
2.0182 0 Td
(to)Tj
1.0262 0 Td
(parsimoniously)Tj
6.4062 0 Td
(favor)Tj
2.2791 0 Td
(a)Tj
0.6519 0 Td
(smaller)Tj
-32.4224 -1.2982 Td
(number)Tj
3.4185 0 Td
(of)Tj
1.0148 0 Td
(partitions.)Tj
-3.2371 -1.3039 Td
(As)Tj
1.2585 0 Td
(in)Tj
1.0318 0 Td
(prior)Tj
2.2451 0 Td
(work,)Tj
2.4944 0 Td
(we)Tj
1.321 0 Td
(model)Tj
2.7382 0 Td
(generalization)Tj
5.8564 0 Td
(as)Tj
1.0091 0 Td
(the)Tj
1.4627 0 Td
(process)Tj
3.1747 0 Td
(of)Tj
1.0035 0 Td
(inferring)Tj
3.7644 0 Td
(the)Tj
1.4627 0 Td
(assignment)Tj
4.7395 0 Td
(of)Tj
1.0091 0 Td
(con-)Tj
-35.7673 -1.2983 Td
(texts)Tj
/F10 1 Tf
2.0636 0 Td
[()]TJ
/F5 1 Tf
0.6859 0 Td
(=)Tj
0.7994 0 Td
({)Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 242.6456 354.7842 cm
BT
/F5 1 Tf
1 TL
-0.0053 Tc
0 0 Td
(1:)Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 251.8299 356.4283 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(})Tj
0.5612 0 Td
(into)Tj
1.8368 0 Td
(clusters)Tj
3.2315 0 Td
(that)Tj
1.7802 0 Td
(share)Tj
2.3357 0 Td
(common)Tj
3.8494 0 Td
(task)Tj
1.8085 0 Td
(statistics.)Tj
3.8154 0 Td
(But)Tj
1.6271 0 Td
(here,)Tj
2.1883 0 Td
(we)Tj
1.3266 0 Td
(decompose)Tj
4.7339 0 Td
(these)Tj
-34.2762 -1.2982 Td
(task)Tj
1.8084 0 Td
(statistics)Tj
3.5829 0 Td
(to)Tj
1.0261 0 Td
(consider)Tj
3.6454 0 Td
(the)Tj
1.4683 0 Td
(possibility)Tj
4.2746 0 Td
(that)Tj
1.7745 0 Td
(that)Tj
1.7802 0 Td
(all)Tj
1.1395 0 Td
(contexts)Tj
/F10 1 Tf
3.5433 0 Td
[()]TJ
/F12 1 Tf
0 Tc
0.5896 0 Td
(2)Tj
/F10 1 Tf
-0.004 Tc
0.8787 0 Td
[()]TJ
/F5 1 Tf
0.6803 0 Td
(share)Tj
2.3357 0 Td
(either)Tj
2.5285 0 Td
(the)Tj
1.4684 0 Td
(same)Tj
2.2563 0 Td
(reward)Tj
-34.7807 -1.2983 Td
(function)Tj
3.6283 0 Td
(and/or)Tj
2.9365 0 Td
(mapping)Tj
3.7871 0 Td
(function,)Tj
3.8551 0 Td
(such)Tj
2.0636 0 Td
(that)Tj
/F10 1 Tf
1.7745 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 386.3622 328.7622 cm
BT
/F10 1 Tf
1 TL
-0.0053 Tc
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 389.8771 330.4629 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(\()Tj
/F10 1 Tf
[()]TJ
/F5 1 Tf
(,)Tj
/F10 1 Tf
1.2472 0 Td
[()]TJ
/F5 1 Tf
(\))Tj
1.2132 0 Td
(=)Tj
/F10 1 Tf
0.7994 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 428.4283 328.7622 cm
BT
/F10 1 Tf
1 TL
-0.0053 Tc
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 431.2062 330.4629 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(\()Tj
/F10 1 Tf
[()]TJ
/F5 1 Tf
(,)Tj
/F10 1 Tf
1.2472 0 Td
[()]TJ
/F5 1 Tf
(\))Tj
/F12 1 Tf
0 Tc
1.2132 0 Td
(8)Tj
/F10 1 Tf
-0.004 Tc
0.771 0 Td
[()]TJ
/F12 1 Tf
0 Tc
0.5953 0 Td
(2)Tj
/F10 1 Tf
-0.004 Tc
0.8731 0 Td
[()]TJ
/F5 1 Tf
0.6859 0 Td
(and/or)Tj
/F10 1 Tf
2.9367 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 519.9307 328.7622 cm
BT
/F10 1 Tf
1 TL
-0.0053 Tc
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 523.4456 330.4629 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(\()Tj
/F10 1 Tf
[( )]TJ
/F5 1 Tf
(,)Tj
/F10 1 Tf
1.2699 0 Td
[()]TJ
/F5 1 Tf
(\))Tj
1.2132 0 Td
(=)Tj
/F10 1 Tf
0.7993 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 561.77 328.7622 cm
BT
/F10 1 Tf
1 TL
-0.0053 Tc
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 564.548 330.4629 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(\()Tj
/F10 1 Tf
[( )]TJ
/F5 1 Tf
(,)Tj
/F10 1 Tf
-36.4533 -1.3039 Td
[()]TJ
/F5 1 Tf
(\))Tj
/F12 1 Tf
0 Tc
1.2133 0 Td
(8)Tj
/F10 1 Tf
-0.004 Tc
0.771 0 Td
[()]TJ
/F12 1 Tf
0 Tc
0.5896 0 Td
(2)Tj
/F10 1 Tf
-0.004 Tc
0.8787 0 Td
[()]TJ
/F5 1 Tf
(.)Tj
0.9128 0 Td
(\(We)Tj
1.9445 0 Td
(return)Tj
2.7609 0 Td
(to)Tj
1.0262 0 Td
(the)Tj
1.474 0 Td
(and/or)Tj
3.719 0 Td
(distinction,)Tj
4.7622 0 Td
(which)Tj
2.6475 0 Td
(affects)Tj
2.7383 0 Td
(whether)Tj
3.4752 0 Td
(clustering)Tj
4.1499 0 Td
(is)Tj
0.8504 0 Td
(indepen-)Tj
-33.9135 -1.2982 Td
(dent)Tj
2.0183 0 Td
(or)Tj
1.0942 0 Td
(joint)Tj
2.0976 0 Td
(across)Tj
2.6815 0 Td
(reward)Tj
3.0331 0 Td
(and)Tj
1.7291 0 Td
(mapping)Tj
3.7871 0 Td
(functions,)Tj
4.2179 0 Td
(in)Tj
1.0318 0 Td
(the)Tj
1.474 0 Td
(following)Tj
3.9742 0 Td
(section\).)Tj
3.6169 0 Td
(Formally,)Tj
4.0536 0 Td
(we)Tj
-34.8093 -1.2983 Td
(define)Tj
2.6986 0 Td
(generalization)Tj
5.8677 0 Td
(as)Tj
1.0148 0 Td
(the)Tj
1.4683 0 Td
(inference)Tj
/F18 1 Tf
0 Tc
0.5839 -1.8538 Td
[()7()]TJ
/F12 1 Tf
()Tj
/F10 1 Tf
[()]TJ
/F12 1 Tf
1.9616 0 Td
(2)Tj
/F10 1 Tf
0.9354 0 Td
[()]TJ
/F12 1 Tf
(j)Tj
/F15 1 Tf
(D)Tj
/F12 1 Tf
()Tj
2.1714 0 Td
(/)Tj
/F18 1 Tf
1.0488 0 Td
[()7()]TJ
/F12 1 Tf
()Tj
/F15 1 Tf
(D)Tj
/F12 1 Tf
(j)Tj
/F10 1 Tf
[()]TJ
/F12 1 Tf
()Tj
/F18 1 Tf
[()7()]TJ
/F12 1 Tf
()Tj
/F10 1 Tf
[()]TJ
/F12 1 Tf
5.1703 0 Td
(2)Tj
/F10 1 Tf
0.9355 0 Td
[()]TJ
/F12 1 Tf
()Tj
12.4893 0 Td
()Tj
/F5 1 Tf
(4)Tj
/F12 1 Tf
()Tj
/F5 1 Tf
-0.004 Tc
-36.3456 -2.1487 Td
(where)Tj
/F18 1 Tf
0 Tc
2.6476 0 Td
[()7()]TJ
/F12 1 Tf
()Tj
/F15 1 Tf
(D)Tj
/F12 1 Tf
(j)Tj
/F10 1 Tf
[()]TJ
/F12 1 Tf
()Tj
/F5 1 Tf
-0.004 Tc
3.4299 0 Td
(is)Tj
0.8447 0 Td
(the)Tj
1.474 0 Td
(likelihood)Tj
4.2349 0 Td
(of)Tj
1.0148 0 Td
(the)Tj
1.4684 0 Td
(observed)Tj
3.7927 0 Td
(data)Tj
/F15 1 Tf
0 Tc
1.9162 0 Td
(D)Tj
/F5 1 Tf
-0.004 Tc
0.9921 0 Td
(given)Tj
2.3811 0 Td
(cluster)Tj
/F10 1 Tf
2.8687 0 Td
[()]TJ
/F5 1 Tf
(,)Tj
0.9127 0 Td
(and)Tj
1.7291 0 Td
(Pr\()Tj
/F10 1 Tf
[()]TJ
/F12 1 Tf
0 Tc
1.8596 0 Td
(2)Tj
/F10 1 Tf
-0.004 Tc
0.8787 0 Td
[()]TJ
/F5 1 Tf
(\))Tj
1.0261 0 Td
(is)Tj
0.8504 0 Td
(a)Tj
0.652 0 Td
(prior)Tj
-34.9737 -1.2983 Td
(over)Tj
1.9729 0 Td
(the)Tj
1.474 0 Td
(clustering)Tj
4.1499 0 Td
(assignment.)Tj
4.972 0 Td
(As)Tj
1.2642 0 Td
(in)Tj
1.0375 0 Td
(previous)Tj
3.651 0 Td
(models)Tj
3.1011 0 Td
(of)Tj
1.0148 0 Td
(generalization,)Tj
6.0944 0 Td
(we)Tj
1.3266 0 Td
(use)Tj
1.5364 0 Td
(the)Tj
1.4683 0 Td
(CRP)Tj
2.0636 0 Td
(as)Tj
1.0148 0 Td
(the)Tj
-36.1415 -1.3039 Td
(cluster)Tj
2.8687 0 Td
(prior.)Tj
2.4831 0 Td
(If)Tj
0.8447 0 Td
(contexts)Tj
3.549 0 Td
({)Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 304.5543 223.7669 cm
BT
/F5 1 Tf
1 TL
-0.0053 Tc
0 0 Td
(1:)Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 313.7385 225.411 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(})Tj
0.5612 0 Td
(are)Tj
1.4457 0 Td
(clustered)Tj
3.8267 0 Td
(into)Tj
/F10 1 Tf
1.8369 0 Td
[()]TJ
/F12 1 Tf
0 Tc
0.9184 0 Td
()Tj
/F10 1 Tf
-0.004 Tc
0.9921 0 Td
[()]TJ
/F5 1 Tf
0.7483 0 Td
(clusters,)Tj
3.4583 0 Td
(then)Tj
2.0182 0 Td
(the)Tj
1.4684 0 Td
(prior)Tj
2.2507 0 Td
(probability)Tj
4.5977 0 Td
(for)Tj
-35.4951 -1.2982 Td
(any)Tj
1.6554 0 Td
(new)Tj
1.8766 0 Td
(context)Tj
/F10 1 Tf
3.1861 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 270.8787 210.7842 cm
BT
/F10 1 Tf
1 TL
-0.0053 Tc
0 0 Td
[()]TJ
/F5 1 Tf
(+1)Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 284.9385 212.4283 cm
BT
/F11 1 Tf
1 TL
0 0 Td
(=)Tj
/F12 1 Tf
-0.085 0 Td
(2)Tj
/F5 1 Tf
-0.004 Tc
0.8786 0 Td
({)Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 299.9622 210.7842 cm
BT
/F5 1 Tf
1 TL
-0.0053 Tc
0 0 Td
(1:)Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 309.1464 212.4283 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(})Tj
0.5612 0 Td
(is:)Tj
/F18 1 Tf
0 Tc
-2.2279 -3.719 Td
[()7()]TJ
/F12 1 Tf
()Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 309.3165 172.7433 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
/F12 1 Tf
0.3401 0 Td
()Tj
/F14 1 Tf
(1)Tj
ET
Q
q
1 j
1 J
0 w
10 0 0 10 322.2992 175.2377 cm
BT
/F12 1 Tf
1 TL
0 0 Td
(2)Tj
/F10 1 Tf
0.9297 0 Td
[()]TJ
/F12 1 Tf
(j)Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 342.7653 172.7433 cm
BT
/F14 1 Tf
1 TL
0 0 Td
(1:)Tj
/F10 1 Tf
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 351.0992 175.2377 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
0.6576 0 Td
()Tj
ET
Q
q
1 j
1 J
0 w
378.7087 190.0346 m
403.5969 190.0346 l
403.5969 189.6378 l
378.7087 189.6378 l
f*
10 0 0 10 386.022 194.1732 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 392.9952 191.6787 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 378.7086 180.5102 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
/F12 1 Tf
0.9921 0 Td
()Tj
/F17 1 Tf
0.9921 0 Td
(a)Tj
/F18 1 Tf
1.5023 0.6859 Td
[()1()]TJ
/F10 1 Tf
1.0489 0 Td
[()]TJ
/F12 1 Tf
0.7483 0 Td
()Tj
/F10 1 Tf
1.0488 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 448.4976 184.8755 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
378.7087 165.0898 m
403.5969 165.0898 l
403.5969 164.6929 l
378.7087 164.6929 l
f*
10 0 0 10 388.6299 169.2283 cm
BT
/F17 1 Tf
1 TL
0 0 Td
(a)Tj
/F10 1 Tf
-0.9921 -1.3662 Td
[()]TJ
/F12 1 Tf
0.9921 0 Td
()Tj
/F17 1 Tf
0.9921 0 Td
(a)Tj
/F18 1 Tf
1.5023 0.6859 Td
[()1()]TJ
/F10 1 Tf
1.0488 0 Td
[()]TJ
/F12 1 Tf
0.7484 0 Td
()Tj
/F10 1 Tf
1.0488 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
5.9998 0 0 5.9998 448.4976 159.9307 cm
BT
/F10 1 Tf
1 TL
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 454.3937 162.4251 cm
BT
/F12 1 Tf
1 TL
0 0 Td
()Tj
/F14 1 Tf
0.9977 0 Td
(1)Tj
/F19 1 Tf
-9.6206 3.9004 Td
(8)Tj
0 -0.8957 Td
(>)Tj
0 -0.2892 Td
(>)Tj
0 -0.2891 Td
(<)Tj
0 -1.7915 Td
(>)Tj
0 -0.2891 Td
(>)Tj
0 -0.2948 Td
(:)Tj
/F12 1 Tf
19.5305 1.2302 Td
()Tj
/F5 1 Tf
(5)Tj
/F12 1 Tf
()Tj
/F5 1 Tf
-0.004 Tc
-36.3455 -4.0251 Td
(where)Tj
/F10 1 Tf
2.6475 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 233.4614 133.3417 cm
BT
/F10 1 Tf
1 TL
-0.0053 Tc
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 239.1307 134.9858 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(is)Tj
0.8503 0 Td
(the)Tj
1.4684 0 Td
(number)Tj
3.4185 0 Td
(of)Tj
1.0148 0 Td
(contexts)Tj
3.5433 0 Td
(associated)Tj
4.2576 0 Td
(with)Tj
1.9956 0 Td
(cluster)Tj
/F10 1 Tf
2.8743 0 Td
[()]TJ
/F5 1 Tf
0.686 0 Td
(and)Tj
/F10 1 Tf
1.7291 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 463.9181 133.3417 cm
BT
/F10 1 Tf
1 TL
-0.0053 Tc
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 470.0976 134.9858 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(is)Tj
0.8447 0 Td
(the)Tj
1.4683 0 Td
(number)Tj
3.4186 0 Td
(of)Tj
1.0148 0 Td
(unique)Tj
-33.7547 -1.2982 Td
(clusters)Tj
3.2315 0 Td
(associated)Tj
4.2576 0 Td
(with)Tj
1.9956 0 Td
(the)Tj
1.4683 0 Td
(n)Tj
0.771 0 Td
(observed)Tj
3.7928 0 Td
(contexts.)Tj
3.7757 0 Td
(If)Tj
/F10 1 Tf
0.8447 0 Td
[()]TJ
/F12 1 Tf
0 Tc
0.686 0 Td
()Tj
/F10 1 Tf
-0.004 Tc
0.9921 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 424.5732 120.359 cm
BT
/F10 1 Tf
1 TL
-0.0053 Tc
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 428.5417 122.0031 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(,)Tj
0.4422 0 Td
(then)Tj
/F10 1 Tf
2.0182 0 Td
[()]TJ
/F5 1 Tf
0.686 0 Td
(is)Tj
0.8504 0 Td
(a)Tj
0.6519 0 Td
(previously)Tj
4.354 0 Td
(encountered)Tj
-31.8554 -1.2982 Td
(cluster,)Tj
3.0954 0 Td
(whereas)Tj
3.4469 0 Td
(if)Tj
/F10 1 Tf
0.771 0 Td
[()]TJ
/F5 1 Tf
0.686 0 Td
(=)Tj
/F10 1 Tf
0.7994 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
7.4999 0 0 6.6659 294.4629 107.3196 cm
BT
/F10 1 Tf
1 TL
-0.0053 Tc
0 0 Td
[()]TJ
ET
Q
q
1 j
1 J
0 w
10 0 0 10 300.5858 109.0204 cm
BT
/F5 1 Tf
1 TL
-0.004 Tc
0 0 Td
(+)Tj
0.7993 0 Td
(1,)Tj
0.9241 0 Td
(then)Tj
/F10 1 Tf
2.0183 0 Td
[()]TJ
/F5 1 Tf
0.6859 0 Td
(is)Tj
0.8448 0 Td
(a)Tj
0.6519 0 Td
(new)Tj
1.8765 0 Td
(cluster.)Tj
3.1011 0 Td
(The)Tj
1.7802 0 Td
(parameter)Tj
/F21 1 Tf
4.3143 0 Td
()Tj
/F5 1 Tf
0.7653 0 Td
(governs)Tj
3.3562 0 Td
(the)Tj
1.4684 0 Td
(propensity)Tj
-32.6435 -1.3039 Td
(to)Tj
1.0261 0 Td
(assign)Tj
2.6532 0 Td
(a)Tj
0.6577 0 Td
(new)Tj
1.8765 0 Td
(context)Tj
3.1804 0 Td
(to)Tj
1.0261 0 Td
(a)Tj
0.6519 0 Td
(new)Tj
1.8766 0 Td
(cluster,)Tj
3.1011 0 Td
(that)Tj
1.7744 0 Td
(is)Tj
0.8504 0 Td
(to)Tj
1.0262 0 Td
(create)Tj
2.5908 0 Td
(a)Tj
0.6576 0 Td
(new)Tj
1.8766 0 Td
(task.)Tj
2.0352 0 Td
(Higher)Tj
3.0387 0 Td
(values)Tj
2.6703 0 Td
(of)Tj
/F21 1 Tf
1.0148 0 Td
()Tj
/F5 1 Tf
0.7653 0 Td
(lead)Tj
1.8539 0 Td
(to)Tj
-36.2038 -1.2982 Td
(a)Tj
0.652 0 Td
(greater)Tj
3.0103 0 Td
(prior)Tj
2.2507 0 Td
(probability)Tj
4.5977 0 Td
(that)Tj
1.7801 0 Td
(a)Tj
0.652 0 Td
(new)Tj
1.8765 0 Td
(cluster)Tj
2.8687 0 Td
(is)Tj
0.8504 0 Td
(created)Tj
3.1237 0 Td
(and)Tj
1.7291 0 Td
(favors)Tj
2.6362 0 Td
(a)Tj
0.652 0 Td
(more)Tj
2.3414 0 Td
(expanded)Tj
4.0875 0 Td
(task)Tj
1.8085 0 Td
(space)Tj
ET
Q
q
1 j
1 J
0 w
576 737.1 m
36 737.1 l
36 737.6 l
576 737.6 l
f*
36 741.2598 169.285 23.6976 re
W* n
q
169.2283 0 0 23.6409 36 741.3165 cm
q
/I0 Do
Q
Q
Q
q
0 0 612 792 re
W* n
1 j
1 J
0 w
7.9999 0 0 7.9999 404.844 745.7952 cm
BT
/F0 1 Tf
1 TL
-0.005 Tc
0 0 Td
(Composit)Tj
4.1527 0 Td
(ional)Tj
2.289 0 Td
(clustering)Tj
4.415 0 Td
(in)Tj
0.978 0 Td
(task)Tj
2.0268 0 Td
(structure)Tj
4.0465 0 Td
(learning)Tj
ET
Q
q
1 j
1 J
0 w
36 48.0002 m
576 48.0002 l
576 47.5002 l
36 47.5002 l
f*
0.83 0.64 0.02 0 k
142.5827 34.9228 m
295.8236 34.9228 l
h
f*
0 g
7.9999 0 0 7.9999 36 36 cm
BT
/F0 1 Tf
1 TL
-0.005 Tc
0 0 Td
(PLOS)Tj
2.8559 0 Td
(Computationa)Tj
6.1229 0 Td
(l)Tj
0.4322 0 Td
(Biology)Tj
3.4371 0 Td
(|)Tj
0.83 0.64 0.02 0 k
0.4748 0 Td
(https:/)Tj
2.6788 0 Td
(/doi.org/10.13)Tj
6.0094 0 Td
(71/journal.p)Tj
5.1166 0 Td
(cbi.1006116)Tj
0 g
6.3497 0 Td
(April)Tj
2.1756 0 Td
(19,)Tj
1.5874 0 Td
(2018)Tj
27.9002 0 Td
(5)Tj
0.7654 0 Td
(/)Tj
ET
endstream
endobj
92 0 obj
<>stream
endstream
endobj
93 0 obj
<>stream
endstream
endobj
94 0 obj
<>stream
endstream
endobj
95 0 obj
<>stream
endstream
endobj
96 0 obj
<>stream
endstream
endobj
97 0 obj
<>stream
endstream
endobj
98 0 obj
<>stream
endstream
endobj
99 0 obj
<>stream
endstream
endobj
100 0 obj
<>stream
endstream
endobj
101 0 obj
<>stream
endstream
endobj
102 0 obj
<>stream
BT
66.402 0 Td
(25)Tj
ET
Q
endstream
endobj
103 0 obj
<>/XObject<>>>/CropBox[0 0 612 792]/MediaBox[0 0 612 792]/Parent 12 0 R/Annots 105 0 R/Contents 106 0 R/TrimBox[0 0 612 792]>>
endobj
104 0 obj
<>stream
xYUŹ}9Wghl$ *t( 4AQѠ*""TTP@@AEAQ{Q{e:֪5^u5g5o=Us
ꝿz?$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ H@$ >ڶmٺug}VCERwyW_}=[nصkצM^{|oذ cǎ}$ H@$ H@$ H@$ .]ڪUvڵ>vWO~ؿ>oL0boH@Jo~~