libcm is a C development framework with an emphasis on audio signal processing applications.
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

cmProc4.h 12KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343
  1. #ifndef cmProc4_h
  2. #define cmProc4_h
  3. #ifdef __cplusplus
  4. extern "C" {
  5. #endif
  6. typedef struct
  7. {
  8. unsigned smpIdx; // time tag sample index for val
  9. cmMidiByte_t val; //
  10. bool validFl; //
  11. } cmScFolBufEle_t;
  12. typedef struct
  13. {
  14. unsigned pitch;
  15. unsigned scEvtIdx;
  16. } cmScFolEvt_t;
  17. typedef struct
  18. {
  19. unsigned evtCnt; //
  20. cmScFolEvt_t* evtV; // pitchV[pitchCnt]
  21. unsigned scIdx; // index of the score loc (into cmScoreEvt[]) at this location
  22. int barNumb; // bar number of this location
  23. } cmScFolLoc_t;
  24. typedef struct
  25. {
  26. cmObj obj;
  27. cmReal_t srate; //
  28. cmScH_t scH; // score handle
  29. unsigned bufN; // event buffer count
  30. cmScFolBufEle_t* bufV; // event buffer bufV[bufN] - bufV[bufN-1] newest event, bufV[boi] oldest event
  31. int locN; // count of score locations
  32. cmScFolLoc_t* loc; // score loc[locN]
  33. unsigned sbi; // oldest score window index
  34. unsigned sei; // newest score window index
  35. unsigned msln; // minimum score look ahead count
  36. unsigned mswn; // maximum score window length
  37. unsigned forwardCnt; // count of score loc's to look ahead for a match to the current pitch when the optimal edit-dist alignment does not produce a match for the current pitch
  38. unsigned maxDist; // max. dist allowed to still consider matching
  39. unsigned minVel; // notes < minVel are ignored
  40. bool printFl; // true if pitch tracker reporting should be included
  41. bool noBackFl; // prevent the tracker from going backwards in time
  42. unsigned* edWndMtx;
  43. unsigned missCnt; // current consecutive unmatched notes
  44. unsigned matchCnt; // current consecutive matched notes
  45. unsigned eventIdx; // events since reset
  46. unsigned skipCnt; // notes skipped due to velocity
  47. unsigned ret_idx; // last tracked location
  48. } cmScFol;
  49. cmScFol* cmScFolAlloc( cmCtx* ctx, cmScFol* p, cmReal_t srate, cmScH_t scH, unsigned bufN, unsigned minWndLookAhead, unsigned maxWndCnt, unsigned minVel );
  50. cmRC_t cmScFolFree( cmScFol** pp );
  51. cmRC_t cmScFolInit( cmScFol* p, cmReal_t srate, cmScH_t scH, unsigned bufN, unsigned minWndLookAhead, unsigned maxWndCnt, unsigned minVel );
  52. cmRC_t cmScFolFinal( cmScFol* p );
  53. // Jump to a score location and reset the internal state of the follower.
  54. cmRC_t cmScFolReset( cmScFol* p, unsigned scoreIndex );
  55. // Give the follower a MIDI performance event. Only MIDI note-on events are acted upon;
  56. // all others are ignored.
  57. unsigned cmScFolExec( cmScFol* p, unsigned smpIdx, unsigned status, cmMidiByte_t d0, cmMidiByte_t d1 );
  58. //=======================================================================================================================
  59. typedef struct
  60. {
  61. unsigned pitch;
  62. unsigned scEvtIdx;
  63. bool matchFl;
  64. } cmScTrkEvt_t;
  65. typedef struct
  66. {
  67. unsigned evtCnt; //
  68. cmScTrkEvt_t* evtV; // evtV[evtCnt]
  69. unsigned scIdx; // index of the score event (into cmScoreEvt[]) at this location
  70. int barNumb; // bar number of this location
  71. } cmScTrkLoc_t;
  72. typedef struct
  73. {
  74. cmObj obj;
  75. cmScFol* sfp;
  76. double srate;
  77. cmScH_t scH;
  78. unsigned locN;
  79. cmScTrkLoc_t* loc;
  80. unsigned minVel;
  81. unsigned maxWndCnt;
  82. unsigned minWndLookAhead;
  83. bool printFl;
  84. int curLocIdx;
  85. unsigned evtIndex;
  86. } cmScTrk;
  87. cmScTrk* cmScTrkAlloc( cmCtx* ctx, cmScTrk* p, cmReal_t srate, cmScH_t scH, unsigned bufN, unsigned minWndLookAhead, unsigned maxWndCnt, unsigned minVel );
  88. cmRC_t cmScTrkFree( cmScTrk** pp );
  89. cmRC_t cmScTrkInit( cmScTrk* p, cmReal_t srate, cmScH_t scH, unsigned bufN, unsigned minWndLookAhead, unsigned maxWndCnt, unsigned minVel );
  90. cmRC_t cmScTrkFinal( cmScTrk* p );
  91. // Jump to a score location and reset the internal state of the follower.
  92. cmRC_t cmScTrkReset( cmScTrk* p, unsigned scoreIndex );
  93. // Give the follower a MIDI performance event. Only MIDI note-on events are acted upon;
  94. // all others are ignored.
  95. unsigned cmScTrkExec( cmScTrk* p, unsigned smpIdx, unsigned status, cmMidiByte_t d0, cmMidiByte_t d1 );
  96. //=======================================================================================================================
  97. //
  98. // Simplified string alignment function based on Levenshtein edit distance.
  99. //
  100. enum { kEdMinIdx, kEdSubIdx, kEdDelIdx, kEdInsIdx, kEdCnt };
  101. typedef struct
  102. {
  103. unsigned v[kEdCnt];
  104. bool matchFl;
  105. bool transFl;
  106. } ed_val;
  107. typedef struct ed_path_str
  108. {
  109. unsigned code;
  110. unsigned ri;
  111. unsigned ci;
  112. bool matchFl;
  113. bool transFl;
  114. struct ed_path_str* next;
  115. } ed_path;
  116. /*
  117. Backtracking:
  118. m[rn,cn] is organized to indicate the mutation operations
  119. on s0[0:rn-1] or s1[0:cn-1] during backtracking.
  120. Backtracking begins at cell m[rn-1,cn-1] and proceeds
  121. up and left toward m[0,0]. The action to perform during
  122. backtracking is determined by examinging which values
  123. int m[].v[1:3] match m[].v[0].
  124. Match Next Cell
  125. Index Operation Location
  126. ----- ------------------------ ------------------------
  127. 1 Substitute char s0[ri-1] move diagonally; up-left
  128. 2 Delete char s0[ri-1] move up.
  129. 3 Delete char s1[ci-1] move left.
  130. (same as inserting blank
  131. into after s[ri-1]
  132. Note that more than one value in m[].v[1:3] may match
  133. m[].v[0]. In this case the candidate solution branches
  134. at this point in the candidate selection processes.
  135. */
  136. typedef struct
  137. {
  138. const char* s0; // forms rows of m[] - mutate to match s1 - rn=strlen(s0)
  139. const char* s1; // forms columns of m[] - target string - cn=strlen(s1)
  140. unsigned rn; // length of s0 + 1
  141. unsigned cn; // length of s1 + 1
  142. ed_val* m; // m[rn,cn]
  143. unsigned pn; // rn+cn
  144. ed_path* p_mem; // pmem[ 2*pn ];
  145. ed_path* p_avl; // available path record linked list
  146. ed_path* p_cur; // current path linked list
  147. ed_path* p_opt; // p_opt[pn] current best alignment
  148. double s_opt; // score of the current best alignment
  149. } ed_r;
  150. // print the DP matrix ed_r.m[rn,cn].
  151. void ed_print_mtx( ed_r* r );
  152. // Initialize ed_r.
  153. void ed_init( ed_r* r, const char* s0, const char* s1 );
  154. // Fill in the DP matrix.
  155. void ed_calc_mtx( ed_r* r );
  156. // Traverse the possible alignments in the DP matrix and determine the optimal alignment.
  157. void ed_align( ed_r* r );
  158. // Print the optimal alignment p_opt[]
  159. void ed_print_opt( ed_r* r );
  160. // Free resource allocated by ed_init().
  161. void ed_free(ed_r* r);
  162. // Main test function.
  163. void ed_main();
  164. //=======================================================================================================================
  165. enum
  166. {
  167. kSaMinIdx,
  168. kSaSubIdx, // 'substitute' - may or may not match
  169. kSaDelIdx, // 'delete' - delete a MIDI note
  170. kSaInsIdx, // 'insert' - insert a space in the score
  171. kSaCnt
  172. };
  173. typedef struct
  174. {
  175. unsigned v[kSaCnt];
  176. bool matchFl; // if this is a substitute; is it also a match?
  177. bool transFl; // if this is a substitute; is this the second element in a reversed pair?
  178. } cmScAlignVal_t;
  179. typedef struct cmScAlignPath_str
  180. {
  181. unsigned code;
  182. unsigned ri;
  183. unsigned ci;
  184. bool matchFl;
  185. bool transFl;
  186. unsigned locIdx;
  187. struct cmScAlignPath_str* next;
  188. } cmScAlignPath_t;
  189. typedef struct
  190. {
  191. unsigned pitch;
  192. unsigned scEvtIdx;
  193. bool matchFl;
  194. } cmScAlignScEvt_t;
  195. typedef struct
  196. {
  197. unsigned evtCnt; //
  198. cmScAlignScEvt_t* evtV; // evtV[evtCnt]
  199. unsigned scLocIdx; // scH score location index
  200. int barNumb; // bar number of this location
  201. } cmScAlignLoc_t;
  202. typedef struct
  203. {
  204. unsigned locIdx; // location assoc'd with this MIDI evt (cmInvalidIdx if not a positive-match)
  205. unsigned cbCnt; // count of times this event has been sent via the callback
  206. unsigned mni; // unique identifier for this event since previous call to cmScAlignReset().
  207. unsigned smpIdx; // time stamp of this event
  208. unsigned pitch; // MIDI note pitch
  209. unsigned vel; // " " velocity
  210. } cmScAlignMidiEvt_t;
  211. typedef struct
  212. {
  213. unsigned locIdx; // loc[] sync. location
  214. unsigned smpIdx; //
  215. unsigned mni; // MIDI event unique index
  216. unsigned pitch; // MIDI event pitch which may not match the score event pitch
  217. unsigned vel; // " " velocity
  218. bool matchFl;
  219. bool transFl;
  220. bool foundFl;
  221. } cmScAlignResult_t;
  222. //
  223. typedef void (*cmScAlignCb_t)( void* cbArg, unsigned scLocIdx, unsigned mni, unsigned pitch, unsigned vel );
  224. typedef struct
  225. {
  226. cmObj obj;
  227. cmScAlignCb_t cbFunc; //
  228. void* cbArg; //
  229. cmScH_t scH; //
  230. double srate; //
  231. unsigned locN; // length of loc[]
  232. cmScAlignLoc_t* loc; // loc[locN] score array
  233. unsigned rn; // length of midiBuf[] (mn+1)
  234. unsigned cn; // length of score window (scWndN+1)
  235. unsigned mn; // length of midiBuf[] (rn-1)
  236. cmScAlignMidiEvt_t* midiBuf; // midiBuf[ mn ]
  237. unsigned mbi; // index of first element in midiBuf[] - this is required because the MIDI buf fills from the end to the beginning
  238. unsigned mni; // index of event in midiBuf[p->mn] - increments on each note inserted into midiBuf[] - zeroed by cmScAlignReset().
  239. cmScAlignVal_t* m; // m[rn,cn]
  240. unsigned pn; // rn+cn
  241. cmScAlignPath_t* p_mem; // pmem[ 2*pn ];
  242. cmScAlignPath_t* p_avl; // available path record linked list
  243. cmScAlignPath_t* p_cur; // current path linked list
  244. cmScAlignPath_t* p_opt; // p_opt[pn] current best alignment
  245. double s_opt; // score of the current best alignment
  246. unsigned esi; // loc[] index of latest positive match
  247. unsigned missCnt; // count of consecutive trailing MIDI events without positive matches
  248. unsigned scanCnt;
  249. bool printFl;
  250. unsigned begScanLocIdx; // begin the search at this score locations scWnd[begScanLocIdx:begScanLocIdx+p->cn-1]
  251. unsigned resN; // count of records in res[] == 2*cmScoreEvtCount()
  252. cmScAlignResult_t* res; // res[resN]
  253. unsigned ri; //
  254. int stepCnt; // count of loc[] locations to step ahead/back during a cmScAlignStep() operation.
  255. int maxStepMissCnt; // max. consecutive trailing non-positive matches before a scan takes place.
  256. } cmScAlign;
  257. cmScAlign* cmScAlignAlloc( cmCtx* ctx, cmScAlign* p, cmScAlignCb_t cbFunc, void* cbArg, cmReal_t srate, cmScH_t scH, unsigned midiN, unsigned scWndN );
  258. cmRC_t cmScAlignFree( cmScAlign** pp );
  259. cmRC_t cmScAlignInit( cmScAlign* p, cmScAlignCb_t cbFunc, void* cbArg, cmReal_t srate, cmScH_t scH, unsigned midiN, unsigned scWndN );
  260. cmRC_t cmScAlignFinal( cmScAlign* p );
  261. void cmScAlignReset( cmScAlign* p, unsigned begScanLocIdx );
  262. bool cmScAlignExec( cmScAlign* p, unsigned smpIdx, unsigned status, cmMidiByte_t d0, cmMidiByte_t d1 );
  263. bool cmScAlignInputMidi( cmScAlign* p, unsigned smpIdx, unsigned status, cmMidiByte_t d0, cmMidiByte_t d1 );
  264. // Scan from p->begScanLocIdx to the end of the score looking
  265. // for the best match to p->midiBuf[].
  266. // Returns the score location index which best matches the
  267. // first note p->midiBuf[]. The score associated
  268. // with this match is stored in s_opt.
  269. unsigned cmScAlignScan( cmScAlign* p, unsigned scanCnt );
  270. // Step forward/back by p->stepCnt from p->esi.
  271. // If more than p->maxStepMissCnt consecutive MIDI events are
  272. // missed then automatically run cmScAlignScan().
  273. bool cmScAlignStep( cmScAlign* p );
  274. unsigned cmScAlignScanToTimeLineEvent( cmScAlign* p, cmTlH_t tlH, cmTlObj_t* top, unsigned endSmpIdx );
  275. // Given a score, a time-line, and a marker on the time line scan the
  276. // entire score looking for the best match between the first 'midiN'
  277. // notes in each marker region and the score.
  278. void cmScAlignScanMarkers( cmRpt_t* rpt, cmTlH_t tlH, cmScH_t scH );
  279. #ifdef __cplusplus
  280. }
  281. #endif
  282. #endif