diff --git a/matchmaker/assets/simple_mozart_k265_var1.musicxml b/matchmaker/assets/simple_mozart_k265_var1.musicxml
index 56bebfc..9130440 100644
--- a/matchmaker/assets/simple_mozart_k265_var1.musicxml
+++ b/matchmaker/assets/simple_mozart_k265_var1.musicxml
@@ -132,7 +132,7 @@
           <line>4</line>
           </clef>
         </attributes>
-      <note default-x="82.98" default-y="-10">
+      <note id="n1" default-x="82.98" default-y="-10">
         <pitch>
           <step>D</step>
           <octave>5</octave>
@@ -145,7 +145,7 @@
         <beam number="1">begin</beam>
         <beam number="2">begin</beam>
         </note>
-      <note default-x="108.93" default-y="-15">
+      <note id="n2" default-x="108.93" default-y="-15">
         <pitch>
           <step>C</step>
           <octave>5</octave>
@@ -158,7 +158,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="134.88" default-y="-20">
+      <note id="n3" default-x="134.88" default-y="-20">
         <pitch>
           <step>B</step>
           <octave>4</octave>
@@ -171,7 +171,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="160.83" default-y="-15">
+      <note id="n4" default-x="160.83" default-y="-15">
         <pitch>
           <step>C</step>
           <octave>5</octave>
@@ -184,7 +184,7 @@
         <beam number="1">end</beam>
         <beam number="2">end</beam>
         </note>
-      <note default-x="186.79" default-y="-20">
+      <note id="n5" default-x="186.79" default-y="-20">
         <pitch>
           <step>B</step>
           <octave>4</octave>
@@ -197,7 +197,7 @@
         <beam number="1">begin</beam>
         <beam number="2">begin</beam>
         </note>
-      <note default-x="212.74" default-y="-15">
+      <note id="n6" default-x="212.74" default-y="-15">
         <pitch>
           <step>C</step>
           <octave>5</octave>
@@ -210,7 +210,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="238.69" default-y="-20">
+      <note id="n7" default-x="238.69" default-y="-20">
         <pitch>
           <step>B</step>
           <octave>4</octave>
@@ -223,7 +223,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="264.65" default-y="-15">
+      <note id="n8" default-x="264.65" default-y="-15">
         <pitch>
           <step>C</step>
           <octave>5</octave>
@@ -239,7 +239,7 @@
       <backup>
         <duration>8</duration>
         </backup>
-      <note default-x="82.98" default-y="-130">
+      <note id="n9" default-x="82.98" default-y="-130">
         <pitch>
           <step>C</step>
           <octave>3</octave>
@@ -250,7 +250,7 @@
         <stem>up</stem>
         <staff>2</staff>
         </note>
-      <note default-x="186.79" default-y="-95">
+      <note id="n10" default-x="186.79" default-y="-95">
         <pitch>
           <step>C</step>
           <octave>4</octave>
@@ -263,7 +263,7 @@
         </note>
       </measure>
     <measure number="2" width="226.76">
-      <note default-x="12.5" default-y="10">
+      <note id="n11" default-x="12.5" default-y="10">
         <pitch>
           <step>A</step>
           <octave>5</octave>
@@ -276,7 +276,7 @@
         <beam number="1">begin</beam>
         <beam number="2">begin</beam>
         </note>
-      <note default-x="38.45" default-y="5">
+      <note id="n12" default-x="38.45" default-y="5">
         <pitch>
           <step>G</step>
           <octave>5</octave>
@@ -289,7 +289,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="67.2" default-y="0">
+      <note id="n13" default-x="67.2" default-y="0">
         <pitch>
           <step>F</step>
           <alter>1</alter>
@@ -304,7 +304,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="93.16" default-y="5">
+      <note id="n14" default-x="93.16" default-y="5">
         <pitch>
           <step>G</step>
           <octave>5</octave>
@@ -317,7 +317,7 @@
         <beam number="1">end</beam>
         <beam number="2">end</beam>
         </note>
-      <note default-x="119.11" default-y="0">
+      <note id="n15" default-x="119.11" default-y="0">
         <pitch>
           <step>F</step>
           <alter>1</alter>
@@ -331,7 +331,7 @@
         <beam number="1">begin</beam>
         <beam number="2">begin</beam>
         </note>
-      <note default-x="145.06" default-y="5">
+      <note id="n16" default-x="145.06" default-y="5">
         <pitch>
           <step>G</step>
           <octave>5</octave>
@@ -344,7 +344,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="171.02" default-y="0">
+      <note id="n17" default-x="171.02" default-y="0">
         <pitch>
           <step>F</step>
           <alter>1</alter>
@@ -358,7 +358,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="196.97" default-y="5">
+      <note id="n18" default-x="196.97" default-y="5">
         <pitch>
           <step>G</step>
           <octave>5</octave>
@@ -374,7 +374,7 @@
       <backup>
         <duration>8</duration>
         </backup>
-      <note default-x="12.5" default-y="-85">
+      <note id="n19" default-x="12.5" default-y="-85">
         <pitch>
           <step>E</step>
           <octave>4</octave>
@@ -385,7 +385,7 @@
         <stem>down</stem>
         <staff>2</staff>
         </note>
-      <note default-x="119.11" default-y="-95">
+      <note id="n20" default-x="119.11" default-y="-95">
         <pitch>
           <step>C</step>
           <octave>4</octave>
@@ -398,7 +398,7 @@
         </note>
       </measure>
     <measure number="3" width="230.22">
-      <note default-x="18.76" default-y="5">
+      <note id="n21" default-x="18.76" default-y="5">
         <pitch>
           <step>G</step>
           <alter>1</alter>
@@ -413,7 +413,7 @@
         <beam number="1">begin</beam>
         <beam number="2">begin</beam>
         </note>
-      <note default-x="44.71" default-y="10">
+      <note id="n22" default-x="44.71" default-y="10">
         <pitch>
           <step>A</step>
           <octave>5</octave>
@@ -426,7 +426,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="70.66" default-y="20">
+      <note id="n23" default-x="70.66" default-y="20">
         <pitch>
           <step>C</step>
           <octave>6</octave>
@@ -439,7 +439,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="96.62" default-y="15">
+      <note id="n24" default-x="96.62" default-y="15">
         <pitch>
           <step>B</step>
           <octave>5</octave>
@@ -452,7 +452,7 @@
         <beam number="1">end</beam>
         <beam number="2">end</beam>
         </note>
-      <note default-x="122.57" default-y="25">
+      <note id="n25" default-x="122.57" default-y="25">
         <pitch>
           <step>D</step>
           <octave>6</octave>
@@ -465,7 +465,7 @@
         <beam number="1">begin</beam>
         <beam number="2">begin</beam>
         </note>
-      <note default-x="148.52" default-y="20">
+      <note id="n26" default-x="148.52" default-y="20">
         <pitch>
           <step>C</step>
           <octave>6</octave>
@@ -478,7 +478,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="174.48" default-y="15">
+      <note id="n27" default-x="174.48" default-y="15">
         <pitch>
           <step>B</step>
           <octave>5</octave>
@@ -491,7 +491,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="200.43" default-y="10">
+      <note id="n28" default-x="200.43" default-y="10">
         <pitch>
           <step>A</step>
           <octave>5</octave>
@@ -507,7 +507,7 @@
       <backup>
         <duration>8</duration>
         </backup>
-      <note default-x="18.76" default-y="-80">
+      <note id="n29" default-x="18.76" default-y="-80">
         <pitch>
           <step>F</step>
           <octave>4</octave>
@@ -518,7 +518,7 @@
         <stem>down</stem>
         <staff>2</staff>
         </note>
-      <note default-x="122.57" default-y="-95">
+      <note id="n30" default-x="122.57" default-y="-95">
         <pitch>
           <step>C</step>
           <octave>4</octave>
@@ -531,7 +531,7 @@
         </note>
       </measure>
     <measure number="4" width="227.14">
-      <note default-x="12.5" default-y="10">
+      <note id="n31" default-x="12.5" default-y="10">
         <pitch>
           <step>A</step>
           <octave>5</octave>
@@ -547,7 +547,7 @@
           <slur type="start" orientation="over" placement="above" number="1"/>
           </notations>
         </note>
-      <note default-x="41.63" default-y="5">
+      <note id="n32" default-x="41.63" default-y="5">
         <pitch>
           <step>G</step>
           <octave>5</octave>
@@ -564,7 +564,7 @@
           <slur type="stop" number="1"/>
           </notations>
         </note>
-      <note default-x="67.58" default-y="30">
+      <note id="n33" default-x="67.58" default-y="30">
         <pitch>
           <step>E</step>
           <octave>6</octave>
@@ -577,7 +577,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="93.54" default-y="25">
+      <note id="n34" default-x="93.54" default-y="25">
         <pitch>
           <step>D</step>
           <octave>6</octave>
@@ -590,7 +590,7 @@
         <beam number="1">end</beam>
         <beam number="2">end</beam>
         </note>
-      <note default-x="119.49" default-y="20">
+      <note id="n35" default-x="119.49" default-y="20">
         <pitch>
           <step>C</step>
           <octave>6</octave>
@@ -603,7 +603,7 @@
         <beam number="1">begin</beam>
         <beam number="2">begin</beam>
         </note>
-      <note default-x="145.44" default-y="15">
+      <note id="n36" default-x="145.44" default-y="15">
         <pitch>
           <step>B</step>
           <octave>5</octave>
@@ -616,7 +616,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="171.4" default-y="10">
+      <note id="n37" default-x="171.4" default-y="10">
         <pitch>
           <step>A</step>
           <octave>5</octave>
@@ -629,7 +629,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="197.35" default-y="5">
+      <note id="n38" default-x="197.35" default-y="5">
         <pitch>
           <step>G</step>
           <octave>5</octave>
@@ -645,7 +645,7 @@
       <backup>
         <duration>8</duration>
         </backup>
-      <note default-x="12.5" default-y="-95">
+      <note id="n39" default-x="12.5" default-y="-95">
         <pitch>
           <step>C</step>
           <octave>4</octave>
@@ -656,7 +656,7 @@
         <stem>down</stem>
         <staff>2</staff>
         </note>
-      <note default-x="12.5" default-y="-85">
+      <note id="n40" default-x="12.5" default-y="-85">
         <chord/>
         <pitch>
           <step>E</step>
@@ -668,7 +668,7 @@
         <stem>down</stem>
         <staff>2</staff>
         </note>
-      <note default-x="119.49" default-y="-125">
+      <note id="n41" default-x="119.49" default-y="-125">
         <rest/>
         <duration>3</duration>
         <voice>5</voice>
@@ -676,7 +676,7 @@
         <dot default-x="135.53" default-y="-120"/>
         <staff>2</staff>
         </note>
-      <note default-x="197.35" default-y="-95">
+      <note id="n42" default-x="197.35" default-y="-95">
         <pitch>
           <step>C</step>
           <alter>1</alter>
@@ -703,7 +703,7 @@
           <staff-distance>65</staff-distance>
           </staff-layout>
         </print>
-      <note default-x="60.86" default-y="5">
+      <note id="n43" default-x="60.86" default-y="5">
         <pitch>
           <step>G</step>
           <octave>5</octave>
@@ -719,7 +719,7 @@
           <slur type="start" orientation="over" placement="above" number="1"/>
           </notations>
         </note>
-      <note default-x="95.12" default-y="0">
+      <note id="n44" default-x="95.12" default-y="0">
         <pitch>
           <step>F</step>
           <octave>5</octave>
@@ -735,7 +735,7 @@
           <slur type="stop" number="1"/>
           </notations>
         </note>
-      <note default-x="129.38" default-y="25">
+      <note id="n45" default-x="129.38" default-y="25">
         <pitch>
           <step>D</step>
           <octave>6</octave>
@@ -748,7 +748,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="163.63" default-y="20">
+      <note id="n46" default-x="163.63" default-y="20">
         <pitch>
           <step>C</step>
           <octave>6</octave>
@@ -761,7 +761,7 @@
         <beam number="1">end</beam>
         <beam number="2">end</beam>
         </note>
-      <note default-x="197.89" default-y="15">
+      <note id="n47" default-x="197.89" default-y="15">
         <pitch>
           <step>B</step>
           <octave>5</octave>
@@ -774,7 +774,7 @@
         <beam number="1">begin</beam>
         <beam number="2">begin</beam>
         </note>
-      <note default-x="232.15" default-y="10">
+      <note id="n48" default-x="232.15" default-y="10">
         <pitch>
           <step>A</step>
           <octave>5</octave>
@@ -787,7 +787,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="266.41" default-y="5">
+      <note id="n49" default-x="266.41" default-y="5">
         <pitch>
           <step>G</step>
           <octave>5</octave>
@@ -800,7 +800,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="300.67" default-y="0">
+      <note id="n50" default-x="300.67" default-y="0">
         <pitch>
           <step>F</step>
           <octave>5</octave>
@@ -816,7 +816,7 @@
       <backup>
         <duration>8</duration>
         </backup>
-      <note default-x="60.86" default-y="-90">
+      <note id="n51" default-x="60.86" default-y="-90">
         <pitch>
           <step>D</step>
           <octave>4</octave>
@@ -827,7 +827,7 @@
         <stem>down</stem>
         <staff>2</staff>
         </note>
-      <note default-x="197.89" default-y="-125">
+      <note id="n52" default-x="197.89" default-y="-125">
         <rest/>
         <duration>3</duration>
         <voice>5</voice>
@@ -835,7 +835,7 @@
         <dot default-x="213.93" default-y="-120"/>
         <staff>2</staff>
         </note>
-      <note default-x="300.67" default-y="-100">
+      <note id="n53" default-x="300.67" default-y="-100">
         <pitch>
           <step>B</step>
           <octave>3</octave>
@@ -848,7 +848,7 @@
         </note>
       </measure>
     <measure number="6" width="294.31">
-      <note default-x="18.44" default-y="0">
+      <note id="n54" default-x="18.44" default-y="0">
         <pitch>
           <step>F</step>
           <octave>5</octave>
@@ -864,7 +864,7 @@
           <slur type="start" orientation="over" placement="above" number="1"/>
           </notations>
         </note>
-      <note default-x="52.7" default-y="-5">
+      <note id="n55" default-x="52.7" default-y="-5">
         <pitch>
           <step>E</step>
           <octave>5</octave>
@@ -880,7 +880,7 @@
           <slur type="stop" number="1"/>
           </notations>
         </note>
-      <note default-x="86.96" default-y="20">
+      <note id="n56" default-x="86.96" default-y="20">
         <pitch>
           <step>C</step>
           <octave>6</octave>
@@ -893,7 +893,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="121.22" default-y="15">
+      <note id="n57" default-x="121.22" default-y="15">
         <pitch>
           <step>B</step>
           <octave>5</octave>
@@ -906,7 +906,7 @@
         <beam number="1">end</beam>
         <beam number="2">end</beam>
         </note>
-      <note default-x="155.48" default-y="10">
+      <note id="n58" default-x="155.48" default-y="10">
         <pitch>
           <step>A</step>
           <octave>5</octave>
@@ -919,7 +919,7 @@
         <beam number="1">begin</beam>
         <beam number="2">begin</beam>
         </note>
-      <note default-x="189.74" default-y="5">
+      <note id="n59" default-x="189.74" default-y="5">
         <pitch>
           <step>G</step>
           <octave>5</octave>
@@ -932,7 +932,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="223.99" default-y="0">
+      <note id="n60" default-x="223.99" default-y="0">
         <pitch>
           <step>F</step>
           <octave>5</octave>
@@ -945,7 +945,7 @@
         <beam number="1">continue</beam>
         <beam number="2">continue</beam>
         </note>
-      <note default-x="258.25" default-y="-5">
+      <note id="n61" default-x="258.25" default-y="-5">
         <pitch>
           <step>E</step>
           <octave>5</octave>
@@ -961,7 +961,7 @@
       <backup>
         <duration>8</duration>
         </backup>
-      <note default-x="18.44" default-y="-95">
+      <note id="n62" default-x="18.44" default-y="-95">
         <pitch>
           <step>C</step>
           <octave>4</octave>
@@ -973,7 +973,7 @@
         <stem>down</stem>
         <staff>2</staff>
         </note>
-      <note default-x="155.48" default-y="-125">
+      <note id="n63" default-x="155.48" default-y="-125">
         <rest/>
         <duration>3</duration>
         <voice>5</voice>
@@ -981,7 +981,7 @@
         <dot default-x="171.51" default-y="-120"/>
         <staff>2</staff>
         </note>
-      <note default-x="258.25" default-y="-105">
+      <note id="n64" default-x="258.25" default-y="-105">
         <pitch>
           <step>A</step>
           <octave>3</octave>
@@ -994,7 +994,7 @@
         </note>
       </measure>
     <measure number="7" width="219.86">
-      <note default-x="12.5" default-y="-10">
+      <note id="n65" default-x="12.5" default-y="-10">
         <pitch>
           <step>D</step>
           <octave>5</octave>
@@ -1006,7 +1006,7 @@
         <staff>1</staff>
         <beam number="1">begin</beam>
         </note>
-      <note default-x="63.89" default-y="10">
+      <note id="n66" default-x="63.89" default-y="10">
         <pitch>
           <step>A</step>
           <octave>5</octave>
@@ -1021,7 +1021,7 @@
           <slur type="start" orientation="over" placement="above" number="1"/>
           </notations>
         </note>
-      <note default-x="115.28" default-y="5">
+      <note id="n67" default-x="115.28" default-y="5">
         <pitch>
           <step>G</step>
           <octave>5</octave>
@@ -1036,7 +1036,7 @@
           <slur type="stop" number="1"/>
           </notations>
         </note>
-      <note default-x="166.67" default-y="-20">
+      <note id="n68" default-x="166.67" default-y="-20">
         <pitch>
           <step>B</step>
           <octave>4</octave>
@@ -1051,7 +1051,7 @@
       <backup>
         <duration>8</duration>
         </backup>
-      <note default-x="12.5" default-y="-115">
+      <note id="n69" default-x="12.5" default-y="-115">
         <pitch>
           <step>F</step>
           <octave>3</octave>
@@ -1062,7 +1062,7 @@
         <stem>down</stem>
         <staff>2</staff>
         </note>
-      <note default-x="115.28" default-y="-110">
+      <note id="n70" default-x="115.28" default-y="-110">
         <pitch>
           <step>G</step>
           <octave>3</octave>
@@ -1075,7 +1075,7 @@
         </note>
       </measure>
     <measure number="8" width="177.67">
-      <note default-x="12.5" default-y="-15">
+      <note id="n71" default-x="12.5" default-y="-15">
         <pitch>
           <step>C</step>
           <octave>5</octave>
@@ -1086,7 +1086,7 @@
         <stem>down</stem>
         <staff>1</staff>
         </note>
-      <note default-x="89.58" default-y="-20">
+      <note id="n72" default-x="89.58" default-y="-20">
         <rest/>
         <duration>4</duration>
         <voice>1</voice>
@@ -1096,7 +1096,7 @@
       <backup>
         <duration>8</duration>
         </backup>
-      <note default-x="12.5" default-y="-95">
+      <note id="n73" default-x="12.5" default-y="-95">
         <pitch>
           <step>C</step>
           <octave>4</octave>
@@ -1107,7 +1107,7 @@
         <stem>down</stem>
         <staff>2</staff>
         </note>
-      <note default-x="89.58" default-y="-130">
+      <note id="n74" default-x="89.58" default-y="-130">
         <pitch>
           <step>C</step>
           <octave>3</octave>
diff --git a/matchmaker/dp/oltw_arzt.py b/matchmaker/dp/oltw_arzt.py
index 89d0d5a..a6749cf 100644
--- a/matchmaker/dp/oltw_arzt.py
+++ b/matchmaker/dp/oltw_arzt.py
@@ -98,6 +98,9 @@ def __init__(
         current_position: int = 0,
         frame_rate: int = FRAME_RATE,
         queue: Optional[RECVQueue] = None,
+        state_to_ref_time_map = None,
+        ref_to_state_time_map = None,
+        state_space = None,
         **kwargs,
     ) -> None:
         super().__init__(reference_features=reference_features)
@@ -173,6 +176,9 @@ def __init__(
             "max_latency": 0,
             "min_latency": float("inf"),
         }
+        self.state_to_ref_time_map = state_to_ref_time_map
+        self.ref_to_state_time_map = ref_to_state_time_map
+        self.state_space = state_space  # TODO: decide on a fallback when state_space is None, e.g. np.unique(self.reference_features.note_array()["onset_beat"])
 
     @property
     def warping_path(self) -> NDArray[np.int32]:
@@ -289,7 +295,7 @@ def step(self, input_features: NDArray[np.float32]) -> None:
         if self.input_index == 0:
             # enforce the first time step to stay at the
             # initial position
-            self.current_position = min(
+            self.current_position = min(  # TODO: is this clamp necessary? min(max(a, b), a) always equals a
                 max(self.current_position, min_index),
                 self.current_position,
             )
diff --git a/matchmaker/matchmaker.py b/matchmaker/matchmaker.py
index 1bd66a1..cb21790 100644
--- a/matchmaker/matchmaker.py
+++ b/matchmaker/matchmaker.py
@@ -7,6 +7,7 @@
 import partitura
 from partitura.io.exportmidi import get_ppq
 from partitura.score import Part, merge_parts
+from partitura.musicanalysis.performance_codec import get_time_maps_from_alignment
 
 from matchmaker.dp import OnlineTimeWarpingArzt, OnlineTimeWarpingDixon
 from matchmaker.features.audio import (
@@ -42,7 +43,7 @@
     transfer_from_score_to_predicted_perf,
 )
 from matchmaker.utils.misc import (
-    adjust_tempo_for_performance_audio,
+    adjust_tempo_for_performance_file,
     generate_score_audio,
     get_tempo_from_score,
     is_audio_file,
@@ -77,7 +78,10 @@
         "dixon": {
             "window_size": 10,
         },
-        "arzt": {},
+        "arzt": {
+            "window_size": 5,
+            "start_window_size": 0.25,
+            "step_size" : 5,},
         "audio_outerhmm": {
             "sample_rate": 16000,
             "frame_rate": 50,
@@ -87,6 +91,9 @@
         "arzt": {
             "processor": "pianoroll",
             "piano_range": True,
+            "window_size": 200,
+            "start_window_size": 200,
+            "step_size": 5,
         },
         "dixon": {
             "processor": "pianoroll",
@@ -166,7 +173,7 @@ def __init__(
         #     raise ValueError(f"Invalid input_type {input_type}")
         self.input_type = input_type
         self.feature_type = feature_type
-        self.frame_rate = frame_rate
+        self.frame_rate = frame_rate if input_type == "audio" else 1
         self.sample_rate = sample_rate
         self.hop_length = sample_rate // self.frame_rate
         self.score_part: Optional[Part] = None
@@ -185,7 +192,7 @@ def __init__(
             raise ValueError(f"Invalid method. Available methods: {AVAILABLE_METHODS}")
 
         self.method = method
-        self.config = kwargs[input_type][self.method]
+        self.config = kwargs[self.input_type][self.method]
         self.auto_adjust_tempo = auto_adjust_tempo
 
         # Apply method-specific defaults from config (only if not explicitly provided by caller)
@@ -276,7 +283,7 @@ def __init__(
 
         # setup distance function
         if distance_func is None:
-            distance_func = DEFAULT_DISTANCE_FUNCS[method]
+            distance_func = DEFAULT_DISTANCE_FUNCS[self.method]
         # setup stream device
 
         if self.input_type == "audio":
@@ -299,18 +306,24 @@ def __init__(
         else:
             raise ValueError(f"Invalid input type {self.input_type}")
 
-        use_score_audio = self.input_type == "audio" and method in {"dixon", "arzt"}
-        self.reference_features = self.preprocess_score(use_score_audio)
+        self.reference_features = self.preprocess_score()
 
         if distance_func is None:
             distance_func = DEFAULT_DISTANCE_FUNCS[method]
 
         if method == "arzt":
+            state_to_ref_time_map, ref_to_state_time_map = self.get_time_maps()
             self.score_follower = OnlineTimeWarpingArzt(
                 reference_features=self.reference_features,
                 queue=self.stream.queue,
                 distance_func=distance_func,
                 frame_rate=self.frame_rate,
+                window_size=self.config["window_size"],
+                start_window_size=self.config["start_window_size"],
+                state_to_ref_time_map=state_to_ref_time_map,
+                ref_to_state_time_map=ref_to_state_time_map,
+                step_size=self.config["step_size"],
+                state_space=np.unique(self.score_part.note_array()["onset_beat"])
             )
         elif method == "dixon":
             self.score_follower = OnlineTimeWarpingDixon(
@@ -327,11 +340,6 @@ def __init__(
                 has_insertions=True,
                 piano_range=self.config["piano_range"],
             )
-        elif method == "outerhmm" and self.input_type == "midi":
-            self.score_follower = OuterProductHMM(
-                reference_features=self.reference_features,
-                queue=self.stream.queue,
-            )
         elif method == "pthmm" and self.input_type == "audio":
             self.score_follower = GaussianAudioPitchTempoHMM(
                 reference_features=self.reference_features,
@@ -348,7 +356,6 @@ def __init__(
         elif method == "pthmm" and self.input_type == "midi":
             self.score_follower = PitchHMM(
                 reference_features=self.reference_features,
-                # observation_model=obs_model,
                 queue=self.stream.queue,
                 has_insertions=True,
                 piano_range=self.config["piano_range"],
@@ -361,22 +368,43 @@ def __init__(
         else:
             raise ValueError("Invalid method")
 
-    def preprocess_score(self, use_score_audio: bool = False):
+    def preprocess_score(self):
         """Preprocess score to extract reference features."""
         if self.auto_adjust_tempo and self.performance_file is not None:
-            self.tempo = adjust_tempo_for_performance_audio(
+            self.tempo = adjust_tempo_for_performance_file(
                 self.score_part, self.performance_file, self.tempo
             )
 
-        if use_score_audio:
-            self.score_audio = generate_score_audio(
-                self.score_part, self.tempo, self.sample_rate
-            ).astype(np.float32)
-            reference_features = self.processor(self.score_audio)
-            self.processor.reset()
-            return reference_features
+        if self.method in {"arzt", "dixon"}:
+            self.ppart = partitura.utils.music.performance_from_part(self.score_part, bpm=self.tempo)
+            self.ppart.sustain_pedal_threshold = 127
+            if self.input_type == "audio":
+                self.score_audio = generate_score_audio(
+                    self.score_part, self.tempo, self.sample_rate
+                ).astype(np.float32)
+                reference_features = self.processor(self.score_audio)
+                self.processor.reset()
+                return reference_features
+            else:
+                polling_period = 0.01
+                reference_features = (
+                    partitura.utils.music.compute_pianoroll(
+                        note_info=self.ppart,
+                        time_unit="sec",
+                        time_div=int(np.round(1 / polling_period)),
+                        binary=True,
+                        piano_range=self.config["piano_range"],
+                    )
+                    .toarray()
+                    .T
+                ).astype(np.float32)
+                return reference_features
         else:
             return self.score_part.note_array()
+    
+    def get_time_maps(self):
+        alignment = [{"label" : "match", "score_id" : nid, "performance_id": nid} for nid in self.score_part.note_array()["id"]]
+        return get_time_maps_from_alignment(self.ppart.note_array(), self.score_part.note_array(), alignment)
 
     def _convert_frame_to_beat(self, current_frame: int) -> float:
         """
diff --git a/matchmaker/utils/misc.py b/matchmaker/utils/misc.py
index b8be392..ce58269 100644
--- a/matchmaker/utils/misc.py
+++ b/matchmaker/utils/misc.py
@@ -13,6 +13,7 @@
 from typing import Any, Dict, Iterable, List, Optional, Union
 
 import librosa
+import mido
 import numpy as np
 import partitura
 import scipy
@@ -425,25 +426,28 @@ def get_tempo_at_beat(
     return current_tempo
 
 
-def adjust_tempo_for_performance_audio(
-    score: ScoreLike, performance_audio: Path, default_tempo: int = 120
+def adjust_tempo_for_performance_file(
+    score: ScoreLike, performance_file: Path, default_tempo: int = 120
 ):
     """
-    Adjust the tempo of the score part to match the performance audio.
+    Adjust the tempo of the score part to match the duration of the performance file (MIDI or audio).
     We round up the tempo to the nearest 20 bpm to avoid too much optimization.
 
     Parameters
     ----------
     score : partitura.score.ScoreLike
         The score to adjust the tempo of.
-    performance_audio : Path
-        The performance audio file to adjust the tempo to.
+    performance_file : Path
+        The performance file (MIDI or audio) whose duration the tempo is adjusted to.
     default_tempo : int
         The default tempo of the score.
     """
     score_midi = partitura.save_score_midi(score, out=None)
     source_length = score_midi.length
-    target_length = librosa.get_duration(path=str(performance_audio))
+    if is_midi_file(performance_file):
+        target_length = mido.MidiFile(performance_file).length
+    else:
+        target_length = librosa.get_duration(path=str(performance_file))
     ratio = target_length / source_length
     rounded_tempo = int(
         (default_tempo / ratio + 19) // 20 * 20