summaryrefslogtreecommitdiffstats
path: root/pico/lib/picodata.h
diff options
context:
space:
mode:
Diffstat (limited to 'pico/lib/picodata.h')
-rw-r--r--pico/lib/picodata.h643
1 files changed, 643 insertions, 0 deletions
diff --git a/pico/lib/picodata.h b/pico/lib/picodata.h
new file mode 100644
index 0000000..637a3ff
--- /dev/null
+++ b/pico/lib/picodata.h
@@ -0,0 +1,643 @@
+/*
+ * Copyright (C) 2008-2009 SVOX AG, Baslerstr. 30, 8048 Zuerich, Switzerland
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+/**
+ * @file picodata.h
+ *
+ * Copyright (C) 2008-2009 SVOX AG, Baslerstr. 30, 8048 Zuerich, Switzerland
+ * All rights reserved.
+ *
+ * History:
+ * - 2009-04-20 -- initial version
+ *
+ */
+#ifndef PICODATA_H_
+#define PICODATA_H_
+
+#include "picodefs.h"
+#include "picoos.h"
+#include "picotrns.h"
+#include "picokfst.h"
+#include "picorsrc.h"
+
+#ifdef __cplusplus
+extern "C" {
+#endif
+#if 0
+}
+#endif
+
+
+/* ***************************************************************
+ * Constants *
+ *****************************************************************/
+
+#define PICODATA_MAX_ITEMS_PER_PHRASE 30
+
+/**
+ * @addtogroup picodata
+ * <b> Pico Data : Item Format </b>\n
+ *
+ The item header is identical for all item types and PUs. Item types
+ that are not handled by a PU are copied.
+
+ Item Header structure\n
+ ---------------------
+ - Byte Content
+ - 0x00 item type
+ - 0x01 item info 1
+ - 0x02 item info 2
+ - 0x03 item length in bytes (not including the header)
+
+ depending on the item type/info, a specific subheader may follow
+ (included in length)
+*/
+
+/* byte offsets of the item header fields (tmp.: use the item functions below to access header fields) */
+#define PICODATA_ITEMIND_TYPE 0 /* item type */
+#define PICODATA_ITEMIND_INFO1 1 /* item info 1 */
+#define PICODATA_ITEMIND_INFO2 2 /* item info 2 */
+#define PICODATA_ITEMIND_LEN 3 /* item length in bytes (not including the header) */
+
+/* ***************************************************************
+ * CharBuffer *
+ *****************************************************************/
+typedef struct picodata_char_buffer * picodata_CharBuffer; /* opaque handle: the struct is only forward-declared in this header */
+
+picodata_CharBuffer picodata_newCharBuffer(picoos_MemoryManager mm,
+ picoos_Common common, picoos_objsize_t size);
+
+void picodata_disposeCharBuffer(picoos_MemoryManager mm,
+ picodata_CharBuffer * this);
+
+/* puts a single char to the cb; should not be used by PUs, only for feeding the initial cb */
+pico_status_t picodata_cbPutCh(register picodata_CharBuffer this, picoos_char ch);
+
+/* gets a single char from the cb; should not be used by PUs other than the first PU in the chain (picotok) */
+picoos_int16 picodata_cbGetCh(register picodata_CharBuffer this);
+
+/* resets cb (as if just created by picodata_newCharBuffer) */
+pico_status_t picodata_cbReset (register picodata_CharBuffer this);
+
+/* ** CharBuffer item functions, cf. below in items section ****/
+
+/* ***************************************************************
+ * items *
+ *****************************************************************/
+
+/* item header size in bytes (type, info 1, info 2, length: one byte each) */
+#define PICODATA_ITEM_HEADSIZE 4
+
+typedef struct picodata_itemhead
+{
+ picoos_uint8 type; /* item type (PICODATA_ITEM_*) */
+ picoos_uint8 info1; /* item info 1 (PICODATA_ITEMINFO1_*) */
+ picoos_uint8 info2; /* item info 2 (PICODATA_ITEMINFO2_*) */
+ picoos_uint8 len; /* item length in bytes (not including the header) */
+} picodata_itemhead_t;
+
+
+/* -------------- System wide defines referred to by items -------- */
+/* ---- These may be better stored in a knowledge module/resource */
+#define PICODATA_ACC0 '\x30' /* 48 '0' */
+#define PICODATA_ACC1 '\x31' /* 49 '1' */
+#define PICODATA_ACC2 '\x32' /* 50 '2' */
+#define PICODATA_ACC3 '\x33' /* 51 '3' */
+#define PICODATA_ACC4 '\x34' /* 52 '4' */
+
+/* reserved for future use:
+ * user-imposed Part-Of-Speech ids for user lexica and phoneme tags
+ * These values should be applied BEFORE POS-disambiguation. The POS lingware either assigns the same
+ * ids to corresponding internal unique or composed POS or else the POS-D will consider these values
+ * "default" */
+#define PICODATA_POS_XNPR 20
+#define PICODATA_POS_XN 21
+#define PICODATA_POS_XV 22
+#define PICODATA_POS_XA 23
+#define PICODATA_POS_XADV 24
+#define PICODATA_POS_XX 25
+
+/* ------------------------- item types ---------------------------- */
+/* new item types, info1, info2 to be defined during PU development */
+/* make sure this stays in sync with "is_valid_itemtype" function */
+#define PICODATA_ITEM_WSEQ_GRAPH '\x73' /* 115, 's' */
+#define PICODATA_ITEM_TOKEN '\x74' /* 116 't' */
+#define PICODATA_ITEM_WORDGRAPH '\x67' /* 103 'g' */
+#define PICODATA_ITEM_WORDINDEX '\x69' /* 105 'i' */
+#define PICODATA_ITEM_WORDPHON '\x77' /* 119 'w' */
+#define PICODATA_ITEM_SYLLPHON '\x79' /* 121 'y' */
+#define PICODATA_ITEM_BOUND '\x62' /* 98 'b' */
+/* #define PICODATA_ITEM_BOUND_DUR '\x64' */ /* 100 'd' */ /* duration-constrained bound */
+#define PICODATA_ITEM_PUNC '\x70' /* 112 'p' */
+#define PICODATA_ITEM_CMD '\x63' /* 99 'c' */
+#define PICODATA_ITEM_PHONE '\x68' /* 104 'h' */ /*reserved for PAM*/
+#define PICODATA_ITEM_FRAME_PAR '\x6b' /* 107 'k' */ /*reserved for CEP*/
+#define PICODATA_ITEM_FRAME '\x66' /* 102 'f' */ /*reserved for SIG*/
+#define PICODATA_ITEM_OTHER '\x6f' /* 111 'o' */
+#define PICODATA_ITEM_ERR '\x00' /* 0 '^@' */
+
+/* generic iteminfo1 */
+#define PICODATA_ITEMINFO1_ERR '\x00' /* 0 '^@' */ /* error state */
+#define PICODATA_ITEMINFO1_NA '\x01' /* 1 '^A' */ /* not applicable */
+
+/* generic iteminfo2 */
+#define PICODATA_ITEMINFO2_ERR '\x00' /* 0 '^@' */ /* error state */
+#define PICODATA_ITEMINFO2_NA '\x01' /* 1 '^A' */ /* not applicable */
+
+/* ------------------------- PUNC item type ---------------------------- */
+/* iteminfo1 */
+#define PICODATA_ITEMINFO1_PUNC_SENTEND '\x73' /* 115 's' */
+#define PICODATA_ITEMINFO1_PUNC_PHRASEEND '\x70' /* 112 'p' */
+#define PICODATA_ITEMINFO1_PUNC_FLUSH '\x66' /* 102 'f' */
+/* iteminfo2 */
+#define PICODATA_ITEMINFO2_PUNC_SENT_T '\x74' /* 116 't' */
+#define PICODATA_ITEMINFO2_PUNC_SENT_Q '\x71' /* 113 'q' */
+#define PICODATA_ITEMINFO2_PUNC_SENT_E '\x65' /* 101 'e' */
+#define PICODATA_ITEMINFO2_PUNC_PHRASE '\x70' /* 112 'p' */
+#define PICODATA_ITEMINFO2_PUNC_PHRASE_FORCED '\x66' /* 102 'f' */
+/* len for PUNC item is ALWAYS = 0 */
+/* ------------------------- BOUND item type ---------------------------- */
+/* iteminfo1 : phrase strength*/
+#define PICODATA_ITEMINFO1_BOUND_SBEG '\x62' /* 98 'b', at sentence begin */
+#define PICODATA_ITEMINFO1_BOUND_SEND '\x73' /* 115 's', at sentence end */
+#define PICODATA_ITEMINFO1_BOUND_TERM '\x74' /* 116 't', replaces a flush */
+#define PICODATA_ITEMINFO1_BOUND_PHR0 '\x30' /* 48 '0', no break, no item */
+#define PICODATA_ITEMINFO1_BOUND_PHR1 '\x31' /* 49 '1', pri. phrase bound. */
+#define PICODATA_ITEMINFO1_BOUND_PHR2 '\x32' /* 50 '2', short break */
+#define PICODATA_ITEMINFO1_BOUND_PHR3 '\x33' /* 51 '3', sec. phr. bound., no break*/
+/* iteminfo2 : phrase type*/
+#define PICODATA_ITEMINFO2_BOUNDTYPE_P '\x50' /* 80 'P' */
+#define PICODATA_ITEMINFO2_BOUNDTYPE_T '\x54' /* 84 'T' */
+#define PICODATA_ITEMINFO2_BOUNDTYPE_Q '\x51' /* 81 'Q' */
+#define PICODATA_ITEMINFO2_BOUNDTYPE_E '\x45' /* 69 'E' */
+/* len for BOUND item is ALWAYS = 0 */
+/* ------------------------- CMD item type ---------------------------- */
+/* iteminfo1 : command type */
+#define PICODATA_ITEMINFO1_CMD_FLUSH 'f' /* 102 flush command (all PUs) */
+#define PICODATA_ITEMINFO1_CMD_PLAY 'p' /* 112 play command : PU in info 2 will read items from file --> filename in item content */
+#define PICODATA_ITEMINFO1_CMD_SAVE 's' /* 115 save command : PU in info 2 will save items to file --> filename in item content */
+#define PICODATA_ITEMINFO1_CMD_UNSAVE 'u' /* 117 unsave command : PU in info 2 will stop saving items to file */
+#define PICODATA_ITEMINFO1_CMD_PROSDOMAIN 'd' /* 100 prosody domain : domain type in info 2, domain name in item content */
+#define PICODATA_ITEMINFO1_CMD_SPELL 'e' /* 101 spell command : info 2 contains start/stop info,
+ spell type/pause len as little endian uint16 in item content */
+#define PICODATA_ITEMINFO1_CMD_IGNSIG 'i' /* 105 ignore signal command : info 2 contains start/stop info */
+#define PICODATA_ITEMINFO1_CMD_PHONEME 'o' /* 111 phoneme command : info 2 contains start/stop info, phonemes in item content */
+#define PICODATA_ITEMINFO1_CMD_IGNORE 'I' /* 73 ignore text command : info 2 contains start/stop info */
+#define PICODATA_ITEMINFO1_CMD_SIL 'z' /* 122 silence command : info 2 contains type of silence;
+ silence duration as little endian uint16 in item content */
+#define PICODATA_ITEMINFO1_CMD_CONTEXT 'c' /* 99 context command : context name in item content */
+#define PICODATA_ITEMINFO1_CMD_VOICE 'v' /* 118 voice command : voice name in item content */
+#define PICODATA_ITEMINFO1_CMD_MARKER 'm' /* 109 marker command : marker name in item content */
+#define PICODATA_ITEMINFO1_CMD_PITCH 'P' /* 80 pitch command : abs/rel info in info 2; pitch level as little endian
+ uint16 in item content; relative value is in promille */
+#define PICODATA_ITEMINFO1_CMD_SPEED 'R' /* 82 speed command : abs/rel info in info 2, speed level as little endian
+ uint16 in item content; relative value is in promille */
+#define PICODATA_ITEMINFO1_CMD_VOLUME 'V' /* 86 volume command : abs/rel info in info 2, volume level as little endian
+ uint16 in item content; relative value is in promille */
+#define PICODATA_ITEMINFO1_CMD_SPEAKER 'S' /* 83 speaker command : abs/rel info in info 2, speaker level as little endian
+ uint16 in item content; relative value is in promille */
+
+/* iteminfo2 for PLAY/SAVE : the PU addressed by the command */
+#define PICODATA_ITEMINFO2_CMD_TO_TOK 't' /* CMD+PLAY/SAVE+TOKENISATION */
+#define PICODATA_ITEMINFO2_CMD_TO_PR 'g' /* CMD+PLAY/SAVE+PREPROC */
+#define PICODATA_ITEMINFO2_CMD_TO_WA 'w' /* CMD+PLAY/SAVE+WORDANA */
+#define PICODATA_ITEMINFO2_CMD_TO_SA 'a' /* CMD+PLAY/SAVE+SENTANA */
+#define PICODATA_ITEMINFO2_CMD_TO_ACPH 'h' /* CMD+PLAY/SAVE+ACCENTUATION&PHRASING */
+#define PICODATA_ITEMINFO2_CMD_TO_SPHO 'p' /* CMD+PLAY/SAVE+SENTENCE PHONOLOGY */
+#define PICODATA_ITEMINFO2_CMD_TO_PAM 'q' /* CMD+PLAY/SAVE+PHONETIC-ACOUSTIC MAPPING */
+#define PICODATA_ITEMINFO2_CMD_TO_CEP 'c' /* CMD+PLAY/SAVE+CEP_SMOOTHER */
+#define PICODATA_ITEMINFO2_CMD_TO_SIG 's' /* CMD+PLAY/SAVE+SIG_GEN */
+
+#if 0
+#define PICODATA_ITEMINFO2_CMD_TO_FST 'f' /* CMD+PLAY/SAVE+FST for Syll and Phonotactic constraints */
+#endif
+
+#define PICODATA_ITEMINFO2_CMD_TO_UNKNOWN 255
+
+/* iteminfo2 for start/end commands */
+#define PICODATA_ITEMINFO2_CMD_START 's'
+#define PICODATA_ITEMINFO2_CMD_END 'e'
+
+/* iteminfo2 for pitch/speed/volume/speaker commands */
+#define PICODATA_ITEMINFO2_CMD_ABSOLUTE 'a'
+#define PICODATA_ITEMINFO2_CMD_RELATIVE 'r'
+
+/* len for CMD item could be >= 0 */
+/* ------------------------- TOKEN item type ---------------------------- */
+/* iteminfo1: simple token type : */
+#define PICODATA_ITEMINFO1_TOKTYPE_SPACE 'W'
+#define PICODATA_ITEMINFO1_TOKTYPE_LETTERV 'V'
+#define PICODATA_ITEMINFO1_TOKTYPE_LETTER 'L'
+#define PICODATA_ITEMINFO1_TOKTYPE_DIGIT 'D'
+#define PICODATA_ITEMINFO1_TOKTYPE_SEQ 'S'
+#define PICODATA_ITEMINFO1_TOKTYPE_CHAR 'C'
+#define PICODATA_ITEMINFO1_TOKTYPE_BEGIN 'B'
+#define PICODATA_ITEMINFO1_TOKTYPE_END 'E'
+#define PICODATA_ITEMINFO1_TOKTYPE_UNDEFINED 'U'
+/* iteminfo2 : token subtype */
+/* len for WORDTOK item is ALWAYS > 0, if len==0 an error should be raised */
+
+/**
+ * @addtogroup picodata
+ *
+ * ------------------------- WORDGRAPH item type ----------------------------
+ * - iteminfo1 : POS and multi-POS values defined in lingware
+ * - iteminfo2 : not applicable
+ * - len for WORDGRAPH item is ALWAYS > 0, if len==0 an error should be raised
+ * (currently picopr may produce empty WORDGRAPH that is eliminated by picowa)
+ * \n------------------------- WORDINDEX item type ----------------------------
+ * - iteminfo1 : POS and multi-POS values defined in lingware
+ * - iteminfo2 : not applicable
+ * - len for WORDINDEX item is ALWAYS > 0, if len==0 an error should be raised
+ * \n------------------------- WORDPHON item type ----------------------------
+ * - iteminfo1 : POS values defined in lingware
+ * - iteminfo2 : Uses PICODATA_ACC0 .. ACC4
+ * - len for WORDPHON item is ALWAYS > 0, if len==0 an error should be raised
+ * \n------------------------- SYLLPHON item type ----------------------------
+ * - iteminfo1 : not applicable
+ * - iteminfo2 : Uses PICODATA_ACC0 .. ACC4
+ * - len for SYLLPHON item is ALWAYS > 0, if len==0 an error should be raised
+ * \n------------------------- PHONE item type (PRODUCED BY PAM)-----------------
+ * - iteminfo1 : phonId : the phonetic identity of the phone
+ * - iteminfo2 : n_S_P_Phone : number of states per phoneme
+ * - len for PHONE item is ALWAYS > 0, if len==0 an error should be raised
+ * \n------------------------- FRAME_PAR item type (PRODUCED BY CEP) --------
+ * - iteminfo1 : format (float, fixed)
+ * - iteminfo2 : vector size
+ * - len for FRAME_PAR item is ALWAYS > 0, if len==0 an error should be raised
+ * \n------------------------- FRAME item type (PRODUCED BY SIG) -----------
+ * - iteminfo1 : number of samples per frame
+ * - iteminfo2 : number of bytes per sample
+ * - len for FRAME item is ALWAYS > 0, if len==0 an error should be raised
+ *
+ */
+#define PICODATA_ITEMINFO1_FRAME_PAR_DATA_FORMAT_FIXED '\x78' /* 120 'x' fixed point */
+#define PICODATA_ITEMINFO1_FRAME_PAR_DATA_FORMAT_FLOAT '\x66' /* 102 'f' floating point */
+
+/* ***************************************************************
+ * items: CharBuffer functions *
+ *****************************************************************/
+
+/* gets a single item (head and content) from a CharBuffer in buf;
+ blenmax is the max length (in number of bytes) of buf; blen is
+ set to the number of bytes gotten in buf; return values:
+ PICO_OK <- one item gotten
+ PICO_EOF <- no item available, cb is empty
+ PICO_EXC_BUF_UNDERFLOW <- cb not empty, but no valid item
+ PICO_EXC_BUF_OVERFLOW <- buf not large enough
+*/
+pico_status_t picodata_cbGetItem(register picodata_CharBuffer this,
+ picoos_uint8 *buf, const picoos_uint16 blenmax,
+ picoos_uint16 *blen);
+
+/* gets the speech data (without item head) from a CharBuffer in buf;
+ blenmax is the max length (in number of bytes) of buf; blen is
+ set to the number of bytes gotten in buf; return values:
+ PICO_OK <- speech data of one item gotten
+ PICO_EOF <- no item available, cb is empty
+ PICO_EXC_BUF_UNDERFLOW <- cb not empty, but no valid item
+ PICO_EXC_BUF_OVERFLOW <- buf not large enough
+*/
+pico_status_t picodata_cbGetSpeechData(register picodata_CharBuffer this,
+ picoos_uint8 *buf, const picoos_uint16 blenmax,
+ picoos_uint16 *blen);
+
+/* puts a single item (head and content) from buf to a CharBuffer;
+ blenmax is the max length (in number of bytes) accessible in buf;
+ blen is set to the number of bytes put from buf; return values:
+ PICO_OK <- one item put
+ PICO_EXC_BUF_UNDERFLOW <- no valid item in buf
+ PICO_EXC_BUF_OVERFLOW <- cb not large enough
+*/
+pico_status_t picodata_cbPutItem(register picodata_CharBuffer this,
+ const picoos_uint8 *buf, const picoos_uint16 blenmax,
+ picoos_uint16 *blen);
+
+/* unsafe, just for measuring purposes */
+picoos_uint8 picodata_cbGetFrontItemType(register picodata_CharBuffer this);
+
+/* ***************************************************************
+ * items: support function *
+ *****************************************************************/
+
+/* checks whether 'ch' is a valid item type (must stay in sync with the PICODATA_ITEM_* defines) */
+picoos_uint8 is_valid_itemtype(const picoos_uint8 ch);
+
+/* gets a single item from buf: the values in head are set and the item
+ content is copied to content; blenmax and clenmax are the max lengths (in
+ number of bytes) accessible in buf and content; clen is set to the number of
+ bytes gotten in content (TODO confirm how "nowarn" differs from picodata_get_itemparts); return values:
+ PICO_OK <- all ok
+ PICO_EXC_BUF_UNDERFLOW <- blenmax problem, or no valid item
+ PICO_EXC_BUF_OVERFLOW <- overflow in content
+*/
+pico_status_t picodata_get_itemparts_nowarn(
+ const picoos_uint8 *buf, const picoos_uint16 blenmax,
+ picodata_itemhead_t *head, picoos_uint8 *content,
+ const picoos_uint16 clenmax, picoos_uint16 *clen);
+
+/* gets from buf a single item, values in head set and item content
+ copied to content; blenmax and clenmax are the max lengths (in
+ number of bytes) accessible in buf and content; clen is set to the
+ number of bytes gotten in content; return values:
+ PICO_OK <- all ok
+ PICO_EXC_BUF_UNDERFLOW <- blenmax problem, or no valid item
+ PICO_EXC_BUF_OVERFLOW <- overflow in content
+*/
+pico_status_t picodata_get_itemparts(
+ const picoos_uint8 *buf, const picoos_uint16 blenmax,
+ picodata_itemhead_t *head, picoos_uint8 *content,
+ const picoos_uint16 clenmax, picoos_uint16 *clen);
+
+/* puts a single item to buf; values in head and content copied to
+ buf; clenmax is the max length (in number of bytes) accessible in
+ content; blenmax is the max length (bytes) accessible in buf; blen
+ is set to the number of bytes put to buf; return values:
+ PICO_OK <- all ok
+ PICO_EXC_BUF_UNDERFLOW <- clenmax problem, or no valid item
+ PICO_EXC_BUF_OVERFLOW <- overflow in buf
+*/
+pico_status_t picodata_put_itemparts(const picodata_itemhead_t *head,
+ const picoos_uint8 *content, const picoos_uint16 clenmax,
+ picoos_uint8 *buf, const picoos_uint16 blenmax, picoos_uint16 *blen);
+
+/* gets from buf info of a single item, values in head are set and
+ content is set to the start of content in buf (not copied!);
+ content is set to NULL if the content length is 0; blenmax is the
+ max lengths (in number of bytes) accessible in buf; return values:
+ PICO_OK <- all ok
+ PICO_EXC_BUF_UNDERFLOW <- blenmax problem, or no valid item
+*/
+pico_status_t picodata_get_iteminfo(
+ picoos_uint8 *buf, const picoos_uint16 blenmax,
+ picodata_itemhead_t *head, picoos_uint8 **content);
+
+/* copies the item in inbuf to outbuf after first checking if there is
+ a valid item in inbuf; inlenmax and outlenmax are the max lengths
+ (in number of bytes) accessible in the buffers; in *numb the total
+ number of bytes copied to outbuf (incl. header) is returned; return
+ values:
+ PICO_OK <- item copied
+ PICO_EXC_BUF_OVERFLOW <- overflow in outbuf
+ PICO_ERR_OTHER <- no valid item in inbuf
+*/
+pico_status_t picodata_copy_item(const picoos_uint8 *inbuf,
+ const picoos_uint16 inlenmax, picoos_uint8 *outbuf,
+ const picoos_uint16 outlenmax, picoos_uint16 *numb);
+
+/* sets the info1 field in the header contained in the item in buf;
+ return values:
+ PICO_OK <- all ok
+ PICO_EXC_BUF_UNDERFLOW <- underflow in buf
+*/
+pico_status_t picodata_set_iteminfo1(picoos_uint8 *buf,
+ const picoos_uint16 blenmax, const picoos_uint8 info);
+
+/* sets the info2 field in the header contained in the item in buf;
+ return values:
+ PICO_OK <- all ok
+ PICO_EXC_BUF_UNDERFLOW <- underflow in buf
+*/
+pico_status_t picodata_set_iteminfo2(picoos_uint8 *buf,
+ const picoos_uint16 blenmax, const picoos_uint8 info);
+
+/* sets the len field in the header contained in the item in buf;
+ return values:
+ PICO_OK <- all ok
+ PICO_EXC_BUF_UNDERFLOW <- underflow in buf
+*/
+pico_status_t picodata_set_itemlen(picoos_uint8 *buf,
+ const picoos_uint16 blenmax, const picoos_uint8 len);
+
+/* check item validity and return TRUE if valid; return FALSE if
+ invalid; ilenmax is the max index to be used in item
+*/
+picoos_uint8 picodata_is_valid_item(const picoos_uint8 *item,
+ const picoos_uint16 ilenmax);
+
+/* return TRUE if head is a valid item head, FALSE otherwise */
+picoos_uint8 picodata_is_valid_itemhead(const picodata_itemhead_t *head);
+
+
+/* ***************************************************************
+ * ProcessingUnit *
+ *****************************************************************/
+/* public */
+
+#define PICODATA_MAX_ITEMSIZE ((picoos_uint16) (PICODATA_ITEM_HEADSIZE + 256)) /* item header plus 256 bytes */
+
+/* different buffer sizes per processing unit; every expansion is fully parenthesized so it stays a single operand inside any expression */
+#define PICODATA_BUFSIZE_DEFAULT ((picoos_uint16) PICODATA_MAX_ITEMSIZE)
+#define PICODATA_BUFSIZE_TEXT ((picoos_uint16) (1 * PICODATA_BUFSIZE_DEFAULT))
+#define PICODATA_BUFSIZE_TOK ((picoos_uint16) (2 * PICODATA_BUFSIZE_DEFAULT))
+#define PICODATA_BUFSIZE_PR ((picoos_uint16) (2 * PICODATA_BUFSIZE_DEFAULT))
+#define PICODATA_BUFSIZE_WA ((picoos_uint16) (2 * PICODATA_BUFSIZE_DEFAULT))
+#define PICODATA_BUFSIZE_SA ((picoos_uint16) (2 * PICODATA_BUFSIZE_DEFAULT))
+#define PICODATA_BUFSIZE_ACPH ((picoos_uint16) (2 * PICODATA_BUFSIZE_DEFAULT))
+#define PICODATA_BUFSIZE_SPHO ((picoos_uint16) (4 * PICODATA_BUFSIZE_DEFAULT))
+#define PICODATA_BUFSIZE_PAM ((picoos_uint16) (4 * PICODATA_BUFSIZE_DEFAULT))
+#define PICODATA_BUFSIZE_CEP ((picoos_uint16) (16 * PICODATA_BUFSIZE_DEFAULT))
+#define PICODATA_BUFSIZE_SIG ((picoos_uint16) (16 * PICODATA_BUFSIZE_DEFAULT))
+#define PICODATA_BUFSIZE_SINK ((picoos_uint16) (1 * PICODATA_BUFSIZE_DEFAULT))
+
+/* different types of processing units */
+typedef enum picodata_putype {
+ PICODATA_PUTYPE_TEXT, /* text */
+ PICODATA_PUTYPE_TOK, /* tokenizer output */
+ PICODATA_PUTYPE_PR, /* preprocessor output */
+ PICODATA_PUTYPE_WA, /* word analysis */
+ PICODATA_PUTYPE_SA, /* sentence analysis */
+ PICODATA_PUTYPE_ACPH, /* accentuation and phrasing */
+ PICODATA_PUTYPE_SPHO, /* sentence phonology (textana postproc) */
+ PICODATA_PUTYPE_PAM, /* phonetics to acoustics mapper processing unit */
+ PICODATA_PUTYPE_CEP, /* cepstral smoothing processing unit */
+ PICODATA_PUTYPE_SIG, /* signal generation processing unit*/
+ PICODATA_PUTYPE_SINK /* item sink unit*/
+} picodata_putype_t;
+
+picoos_uint16 picodata_get_default_buf_size (picodata_putype_t puType);
+
+/* result values returned from the pu->step() method (see picodata_puStepMethod) */
+typedef enum picodata_step_result {
+ PICODATA_PU_ERROR,
+ /* PICODATA_PU_EMPTY, *//* reserved (no internal data to be processed) */
+ PICODATA_PU_IDLE, /* need more input to process internal data */
+ PICODATA_PU_BUSY, /* processing internal data */
+ PICODATA_PU_ATOMIC, /* same as PICODATA_PU_BUSY, but wants to get the next time slot (while in an "atomic" operation) */
+ PICODATA_PU_OUT_FULL /* can't proceed because output is full (next time slot to be assigned to the consumer of the pu's output) */
+} picodata_step_result_t;
+
+typedef struct picodata_processing_unit * picodata_ProcessingUnit;
+
+picodata_ProcessingUnit picodata_newProcessingUnit(
+ picoos_MemoryManager mm,
+ picoos_Common common,
+ picodata_CharBuffer cbIn,
+ picodata_CharBuffer cbOut,
+ picorsrc_Voice voice);
+
+void picodata_disposeProcessingUnit(
+ picoos_MemoryManager mm,
+ picodata_ProcessingUnit * this);
+
+picodata_CharBuffer picodata_getCbIn(picodata_ProcessingUnit this);
+picodata_CharBuffer picodata_getCbOut(picodata_ProcessingUnit this);
+pico_status_t picodata_setCbIn(picodata_ProcessingUnit this, picodata_CharBuffer cbIn);
+pico_status_t picodata_setCbOut(picodata_ProcessingUnit this, picodata_CharBuffer cbOut);
+
+/* protected */
+typedef pico_status_t (* picodata_puInitializeMethod) (register picodata_ProcessingUnit this);
+typedef pico_status_t (* picodata_puTerminateMethod) (register picodata_ProcessingUnit this);
+typedef picodata_step_result_t (* picodata_puStepMethod) (register picodata_ProcessingUnit this, picoos_int16 mode, picoos_uint16 * numBytesOutput);
+typedef pico_status_t (* picodata_puSubDeallocateMethod) (register picodata_ProcessingUnit this, picoos_MemoryManager mm);
+
+typedef struct picodata_processing_unit
+{
+ /* public */
+ picodata_puInitializeMethod initialize;
+ picodata_puStepMethod step;
+ picodata_puTerminateMethod terminate;
+ picorsrc_Voice voice;
+
+ /* protected */
+ picoos_Common common;
+ picodata_CharBuffer cbIn, cbOut;
+ picodata_puSubDeallocateMethod subDeallocate;
+ void * subObj;
+
+} picodata_processing_unit_t;
+
+/* currently, only wav input and output is supported */
+#define PICODATA_PUTYPE_TEXT_OUTPUT_EXTENSION (picoos_uchar*)".txt"
+#define PICODATA_PUTYPE_TOK_INPUT_EXTENSION PICODATA_PUTYPE_TEXT_OUTPUT_EXTENSION
+#define PICODATA_PUTYPE_TOK_OUTPUT_EXTENSION (picoos_uchar*)".tok"
+#define PICODATA_PUTYPE_PR_INPUT_EXTENSION PICODATA_PUTYPE_TOK_OUTPUT_EXTENSION
+#define PICODATA_PUTYPE_PR_OUTPUT_EXTENSION (picoos_uchar*)".pr"
+#define PICODATA_PUTYPE_WA_INPUT_EXTENSION PICODATA_PUTYPE_PR_OUTPUT_EXTENSION
+#define PICODATA_PUTYPE_WA_OUTPUT_EXTENSION (picoos_uchar*)".wa"
+#define PICODATA_PUTYPE_SA_INPUT_EXTENSION PICODATA_PUTYPE_WA_OUTPUT_EXTENSION
+#define PICODATA_PUTYPE_SA_OUTPUT_EXTENSION (picoos_uchar*)".sa"
+#define PICODATA_PUTYPE_ACPH_INPUT_EXTENSION PICODATA_PUTYPE_SA_OUTPUT_EXTENSION
+#define PICODATA_PUTYPE_ACPH_OUTPUT_EXTENSION (picoos_uchar*)".acph"
+#define PICODATA_PUTYPE_SPHO_INPUT_EXTENSION PICODATA_PUTYPE_ACPH_OUTPUT_EXTENSION
+#define PICODATA_PUTYPE_SPHO_OUTPUT_EXTENSION (picoos_uchar*)".spho"
+#define PICODATA_PUTYPE_PAM_INPUT_EXTENSION PICODATA_PUTYPE_SPHO_OUTPUT_EXTENSION
+#define PICODATA_PUTYPE_PAM_OUTPUT_EXTENSION (picoos_uchar*)".pam"
+#define PICODATA_PUTYPE_CEP_INPUT_EXTENSION PICODATA_PUTYPE_PAM_OUTPUT_EXTENSION
+#define PICODATA_PUTYPE_CEP_OUTPUT_EXTENSION (picoos_uchar*)".cep"
+#define PICODATA_PUTYPE_SIG_INPUT_EXTENSION PICODATA_PUTYPE_CEP_OUTPUT_EXTENSION /*PP 11.7.08*/
+#define PICODATA_PUTYPE_SIG_OUTPUT_EXTENSION (picoos_uchar*)".sig"
+#define PICODATA_PUTYPE_SINK_INPUT_EXTENSION PICODATA_PUTYPE_SIG_OUTPUT_EXTENSION
+
+/*wav input is for play wav files in sig */
+#define PICODATA_PUTYPE_WAV_INPUT_EXTENSION (picoos_uchar*)".wav" /*PP 11.7.08*/
+
+/*wav output is for saving wav (binary) files in sig*/
+#define PICODATA_PUTYPE_WAV_OUTPUT_EXTENSION (picoos_uchar*)".wav" /*PP 14.7.08*/
+
+/* ***************************************************************
+ * auxiliary routines *
+ *****************************************************************/
+
+picoos_uint8 picodata_getPuTypeFromExtension(picoos_uchar * filename, picoos_bool input);
+
+#define PICODATA_XSAMPA (picoos_uchar *)"xsampa"
+#define PICODATA_SAMPA (picoos_uchar *)"sampa"
+#define PICODATA_SVOXPA (picoos_uchar *)"svoxpa"
+
+/*----------------------------------------------------------*/
+/** @brief maps an input phone string to its internal representation
+ *
+ * @param transducer initialized SimpleTransducer
+ * @param xsampa_parser fst converting xsampa char input to xsampa ids
+ * @param svoxpa_parser
+ * @param xsampa2svoxpa_mapper
+ * @param inputPhones input phone string in alphabet 'alphabet'
+ * @param alphabet input alphabet
+ * @param[out] outputPhoneIds output phone string in internal representation
+ * @param maxOutputPhoneIds
+ * @return PICO_OK=mapping done, PICO_ERR_OTHER:unknown alphabet, unknown phones
+ */
+/*---------------------------------------------------------*/
+pico_status_t picodata_mapPAStrToPAIds(
+ picotrns_SimpleTransducer transducer,
+ picoos_Common common,
+ picokfst_FST xsampa_parser,
+ picokfst_FST svoxpa_parser,
+ picokfst_FST xsampa2svoxpa_mapper,
+ picoos_uchar * inputPhones,
+ picoos_uchar * alphabet,
+ picoos_uint8 * outputPhoneIds,
+ picoos_int32 maxOutputPhoneIds);
+
+/* number of binary digits after the comma for fixed-point calculation */
+#define PICODATA_PRECISION 10
+/* constant 0.5 in PICODATA_PRECISION */
+#define PICODATA_PREC_HALF 512
+
+void picodata_transformDurations(
+ picoos_uint8 frame_duration_exp,
+ picoos_int8 array_length,
+ picoos_uint8 * inout,
+ const picoos_uint16 * weight, /* integer weights */
+ picoos_int16 mintarget, /* minimum target duration in ms */
+ picoos_int16 maxtarget, /* maximum target duration in ms */
+ picoos_int16 facttarget, /* factor to be multiplied with original length to get the target;
+ the factor is fixed-point (presumably with PICODATA_PRECISION fractional bits, i.e.
+ the factor as float would be facttarget / 2^PICODATA_PRECISION -- TODO confirm);
+ if factor is 0, only min/max are considered */
+ picoos_int16 * dur_rest /* in/out, rest in ms */
+ );
+
+
+
+/* ***************************************************************
+ * For Debugging only *
+ *****************************************************************/
+
+#if defined (PICO_DEBUG)
+
+/* convert (pretty print) item head 'head' and put output in 'str',
+ strsize is the maximum length of 'str' in bytes */
+picoos_char * picodata_head_to_string(const picodata_itemhead_t *head,
+ picoos_char * str, picoos_uint16 strsize);
+
+/* pretty print 'item', prefixed with 'pref6ch' (max. 6 char prefix);
+ itemlenmax is presumably the max length (in bytes) accessible in 'item';
+ NOTE(review): there is no 'str' parameter -- output destination and the role of kb/filterfn to be confirmed */
+void picodata_info_item(const picoknow_KnowledgeBase kb,
+ const picoos_uint8 *pref6ch,
+ const picoos_uint8 *item,
+ const picoos_uint16 itemlenmax,
+ const picoos_char *filterfn);
+
+/* calls PICODBG_INFO_CTX(), then picodata_info_item() with __FILE__ as filterfn; do { } while (0) keeps the expansion a single statement */
+#define PICODATA_INFO_ITEM(kb, pref, item, itemlenmax) \
+ do { PICODBG_INFO_CTX(); \
+ picodata_info_item(kb, pref, item, itemlenmax, (picoos_char *)__FILE__); } while (0)
+
+
+
+#else
+
+#define PICODATA_INFO_ITEM(kb, pref, item, itemlenmax)
+
+#endif
+
+#ifdef __cplusplus
+}
+#endif
+
+#endif /*PICODATA_H_*/