--- /dev/null
+ GNU GENERAL PUBLIC LICENSE
+ Version 2, June 1991
+
+ Copyright (C) 1989, 1991 Free Software Foundation, Inc.
+ 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ Everyone is permitted to copy and distribute verbatim copies
+ of this license document, but changing it is not allowed.
+
+ Preamble
+
+ The licenses for most software are designed to take away your
+freedom to share and change it. By contrast, the GNU General Public
+License is intended to guarantee your freedom to share and change free
+software--to make sure the software is free for all its users. This
+General Public License applies to most of the Free Software
+Foundation's software and to any other program whose authors commit to
+using it. (Some other Free Software Foundation software is covered by
+the GNU Library General Public License instead.) You can apply it to
+your programs, too.
+
+ When we speak of free software, we are referring to freedom, not
+price. Our General Public Licenses are designed to make sure that you
+have the freedom to distribute copies of free software (and charge for
+this service if you wish), that you receive source code or can get it
+if you want it, that you can change the software or use pieces of it
+in new free programs; and that you know you can do these things.
+
+ To protect your rights, we need to make restrictions that forbid
+anyone to deny you these rights or to ask you to surrender the rights.
+These restrictions translate to certain responsibilities for you if you
+distribute copies of the software, or if you modify it.
+
+ For example, if you distribute copies of such a program, whether
+gratis or for a fee, you must give the recipients all the rights that
+you have. You must make sure that they, too, receive or can get the
+source code. And you must show them these terms so they know their
+rights.
+
+ We protect your rights with two steps: (1) copyright the software, and
+(2) offer you this license which gives you legal permission to copy,
+distribute and/or modify the software.
+
+ Also, for each author's protection and ours, we want to make certain
+that everyone understands that there is no warranty for this free
+software. If the software is modified by someone else and passed on, we
+want its recipients to know that what they have is not the original, so
+that any problems introduced by others will not reflect on the original
+authors' reputations.
+
+ Finally, any free program is threatened constantly by software
+patents. We wish to avoid the danger that redistributors of a free
+program will individually obtain patent licenses, in effect making the
+program proprietary. To prevent this, we have made it clear that any
+patent must be licensed for everyone's free use or not licensed at all.
+
+ The precise terms and conditions for copying, distribution and
+modification follow.
+\f
+ GNU GENERAL PUBLIC LICENSE
+ TERMS AND CONDITIONS FOR COPYING, DISTRIBUTION AND MODIFICATION
+
+ 0. This License applies to any program or other work which contains
+a notice placed by the copyright holder saying it may be distributed
+under the terms of this General Public License. The "Program", below,
+refers to any such program or work, and a "work based on the Program"
+means either the Program or any derivative work under copyright law:
+that is to say, a work containing the Program or a portion of it,
+either verbatim or with modifications and/or translated into another
+language. (Hereinafter, translation is included without limitation in
+the term "modification".) Each licensee is addressed as "you".
+
+Activities other than copying, distribution and modification are not
+covered by this License; they are outside its scope. The act of
+running the Program is not restricted, and the output from the Program
+is covered only if its contents constitute a work based on the
+Program (independent of having been made by running the Program).
+Whether that is true depends on what the Program does.
+
+ 1. You may copy and distribute verbatim copies of the Program's
+source code as you receive it, in any medium, provided that you
+conspicuously and appropriately publish on each copy an appropriate
+copyright notice and disclaimer of warranty; keep intact all the
+notices that refer to this License and to the absence of any warranty;
+and give any other recipients of the Program a copy of this License
+along with the Program.
+
+You may charge a fee for the physical act of transferring a copy, and
+you may at your option offer warranty protection in exchange for a fee.
+
+ 2. You may modify your copy or copies of the Program or any portion
+of it, thus forming a work based on the Program, and copy and
+distribute such modifications or work under the terms of Section 1
+above, provided that you also meet all of these conditions:
+
+ a) You must cause the modified files to carry prominent notices
+ stating that you changed the files and the date of any change.
+
+ b) You must cause any work that you distribute or publish, that in
+ whole or in part contains or is derived from the Program or any
+ part thereof, to be licensed as a whole at no charge to all third
+ parties under the terms of this License.
+
+ c) If the modified program normally reads commands interactively
+ when run, you must cause it, when started running for such
+ interactive use in the most ordinary way, to print or display an
+ announcement including an appropriate copyright notice and a
+ notice that there is no warranty (or else, saying that you provide
+ a warranty) and that users may redistribute the program under
+ these conditions, and telling the user how to view a copy of this
+ License. (Exception: if the Program itself is interactive but
+ does not normally print such an announcement, your work based on
+ the Program is not required to print an announcement.)
+\f
+These requirements apply to the modified work as a whole. If
+identifiable sections of that work are not derived from the Program,
+and can be reasonably considered independent and separate works in
+themselves, then this License, and its terms, do not apply to those
+sections when you distribute them as separate works. But when you
+distribute the same sections as part of a whole which is a work based
+on the Program, the distribution of the whole must be on the terms of
+this License, whose permissions for other licensees extend to the
+entire whole, and thus to each and every part regardless of who wrote it.
+
+Thus, it is not the intent of this section to claim rights or contest
+your rights to work written entirely by you; rather, the intent is to
+exercise the right to control the distribution of derivative or
+collective works based on the Program.
+
+In addition, mere aggregation of another work not based on the Program
+with the Program (or with a work based on the Program) on a volume of
+a storage or distribution medium does not bring the other work under
+the scope of this License.
+
+ 3. You may copy and distribute the Program (or a work based on it,
+under Section 2) in object code or executable form under the terms of
+Sections 1 and 2 above provided that you also do one of the following:
+
+ a) Accompany it with the complete corresponding machine-readable
+ source code, which must be distributed under the terms of Sections
+ 1 and 2 above on a medium customarily used for software interchange; or,
+
+ b) Accompany it with a written offer, valid for at least three
+ years, to give any third party, for a charge no more than your
+ cost of physically performing source distribution, a complete
+ machine-readable copy of the corresponding source code, to be
+ distributed under the terms of Sections 1 and 2 above on a medium
+ customarily used for software interchange; or,
+
+ c) Accompany it with the information you received as to the offer
+ to distribute corresponding source code. (This alternative is
+ allowed only for noncommercial distribution and only if you
+ received the program in object code or executable form with such
+ an offer, in accord with Subsection b above.)
+
+The source code for a work means the preferred form of the work for
+making modifications to it. For an executable work, complete source
+code means all the source code for all modules it contains, plus any
+associated interface definition files, plus the scripts used to
+control compilation and installation of the executable. However, as a
+special exception, the source code distributed need not include
+anything that is normally distributed (in either source or binary
+form) with the major components (compiler, kernel, and so on) of the
+operating system on which the executable runs, unless that component
+itself accompanies the executable.
+
+If distribution of executable or object code is made by offering
+access to copy from a designated place, then offering equivalent
+access to copy the source code from the same place counts as
+distribution of the source code, even though third parties are not
+compelled to copy the source along with the object code.
+\f
+ 4. You may not copy, modify, sublicense, or distribute the Program
+except as expressly provided under this License. Any attempt
+otherwise to copy, modify, sublicense or distribute the Program is
+void, and will automatically terminate your rights under this License.
+However, parties who have received copies, or rights, from you under
+this License will not have their licenses terminated so long as such
+parties remain in full compliance.
+
+ 5. You are not required to accept this License, since you have not
+signed it. However, nothing else grants you permission to modify or
+distribute the Program or its derivative works. These actions are
+prohibited by law if you do not accept this License. Therefore, by
+modifying or distributing the Program (or any work based on the
+Program), you indicate your acceptance of this License to do so, and
+all its terms and conditions for copying, distributing or modifying
+the Program or works based on it.
+
+ 6. Each time you redistribute the Program (or any work based on the
+Program), the recipient automatically receives a license from the
+original licensor to copy, distribute or modify the Program subject to
+these terms and conditions. You may not impose any further
+restrictions on the recipients' exercise of the rights granted herein.
+You are not responsible for enforcing compliance by third parties to
+this License.
+
+ 7. If, as a consequence of a court judgment or allegation of patent
+infringement or for any other reason (not limited to patent issues),
+conditions are imposed on you (whether by court order, agreement or
+otherwise) that contradict the conditions of this License, they do not
+excuse you from the conditions of this License. If you cannot
+distribute so as to satisfy simultaneously your obligations under this
+License and any other pertinent obligations, then as a consequence you
+may not distribute the Program at all. For example, if a patent
+license would not permit royalty-free redistribution of the Program by
+all those who receive copies directly or indirectly through you, then
+the only way you could satisfy both it and this License would be to
+refrain entirely from distribution of the Program.
+
+If any portion of this section is held invalid or unenforceable under
+any particular circumstance, the balance of the section is intended to
+apply and the section as a whole is intended to apply in other
+circumstances.
+
+It is not the purpose of this section to induce you to infringe any
+patents or other property right claims or to contest validity of any
+such claims; this section has the sole purpose of protecting the
+integrity of the free software distribution system, which is
+implemented by public license practices. Many people have made
+generous contributions to the wide range of software distributed
+through that system in reliance on consistent application of that
+system; it is up to the author/donor to decide if he or she is willing
+to distribute software through any other system and a licensee cannot
+impose that choice.
+
+This section is intended to make thoroughly clear what is believed to
+be a consequence of the rest of this License.
+\f
+ 8. If the distribution and/or use of the Program is restricted in
+certain countries either by patents or by copyrighted interfaces, the
+original copyright holder who places the Program under this License
+may add an explicit geographical distribution limitation excluding
+those countries, so that distribution is permitted only in or among
+countries not thus excluded. In such case, this License incorporates
+the limitation as if written in the body of this License.
+
+ 9. The Free Software Foundation may publish revised and/or new versions
+of the General Public License from time to time. Such new versions will
+be similar in spirit to the present version, but may differ in detail to
+address new problems or concerns.
+
+Each version is given a distinguishing version number. If the Program
+specifies a version number of this License which applies to it and "any
+later version", you have the option of following the terms and conditions
+either of that version or of any later version published by the Free
+Software Foundation. If the Program does not specify a version number of
+this License, you may choose any version ever published by the Free Software
+Foundation.
+
+ 10. If you wish to incorporate parts of the Program into other free
+programs whose distribution conditions are different, write to the author
+to ask for permission. For software which is copyrighted by the Free
+Software Foundation, write to the Free Software Foundation; we sometimes
+make exceptions for this. Our decision will be guided by the two goals
+of preserving the free status of all derivatives of our free software and
+of promoting the sharing and reuse of software generally.
+
+ NO WARRANTY
+
+ 11. BECAUSE THE PROGRAM IS LICENSED FREE OF CHARGE, THERE IS NO WARRANTY
+FOR THE PROGRAM, TO THE EXTENT PERMITTED BY APPLICABLE LAW. EXCEPT WHEN
+OTHERWISE STATED IN WRITING THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES
+PROVIDE THE PROGRAM "AS IS" WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED
+OR IMPLIED, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE. THE ENTIRE RISK AS
+TO THE QUALITY AND PERFORMANCE OF THE PROGRAM IS WITH YOU. SHOULD THE
+PROGRAM PROVE DEFECTIVE, YOU ASSUME THE COST OF ALL NECESSARY SERVICING,
+REPAIR OR CORRECTION.
+
+ 12. IN NO EVENT UNLESS REQUIRED BY APPLICABLE LAW OR AGREED TO IN WRITING
+WILL ANY COPYRIGHT HOLDER, OR ANY OTHER PARTY WHO MAY MODIFY AND/OR
+REDISTRIBUTE THE PROGRAM AS PERMITTED ABOVE, BE LIABLE TO YOU FOR DAMAGES,
+INCLUDING ANY GENERAL, SPECIAL, INCIDENTAL OR CONSEQUENTIAL DAMAGES ARISING
+OUT OF THE USE OR INABILITY TO USE THE PROGRAM (INCLUDING BUT NOT LIMITED
+TO LOSS OF DATA OR DATA BEING RENDERED INACCURATE OR LOSSES SUSTAINED BY
+YOU OR THIRD PARTIES OR A FAILURE OF THE PROGRAM TO OPERATE WITH ANY OTHER
+PROGRAMS), EVEN IF SUCH HOLDER OR OTHER PARTY HAS BEEN ADVISED OF THE
+POSSIBILITY OF SUCH DAMAGES.
+
+ END OF TERMS AND CONDITIONS
+\f
+ How to Apply These Terms to Your New Programs
+
+ If you develop a new program, and you want it to be of the greatest
+possible use to the public, the best way to achieve this is to make it
+free software which everyone can redistribute and change under these terms.
+
+ To do so, attach the following notices to the program. It is safest
+to attach them to the start of each source file to most effectively
+convey the exclusion of warranty; and each file should have at least
+the "copyright" line and a pointer to where the full notice is found.
+
+ <one line to give the program's name and a brief idea of what it does.>
+ Copyright (C) <year> <name of author>
+
+ This program is free software; you can redistribute it and/or modify
+ it under the terms of the GNU General Public License as published by
+ the Free Software Foundation; either version 2 of the License, or
+ (at your option) any later version.
+
+ This program is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ GNU General Public License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+
+
+Also add information on how to contact you by electronic and paper mail.
+
+If the program is interactive, make it output a short notice like this
+when it starts in an interactive mode:
+
+ Gnomovision version 69, Copyright (C) year name of author
+ Gnomovision comes with ABSOLUTELY NO WARRANTY; for details type `show w'.
+ This is free software, and you are welcome to redistribute it
+ under certain conditions; type `show c' for details.
+
+The hypothetical commands `show w' and `show c' should show the appropriate
+parts of the General Public License. Of course, the commands you use may
+be called something other than `show w' and `show c'; they could even be
+mouse-clicks or menu items--whatever suits your program.
+
+You should also get your employer (if you work as a programmer) or your
+school, if any, to sign a "copyright disclaimer" for the program, if
+necessary. Here is a sample; alter the names:
+
+ Yoyodyne, Inc., hereby disclaims all copyright interest in the program
+ `Gnomovision' (which makes passes at compilers) written by James Hacker.
+
+ <signature of Ty Coon>, 1 April 1989
+ Ty Coon, President of Vice
+
+This General Public License does not permit incorporating your program into
+proprietary programs. If your program is a subroutine library, you may
+consider it more useful to permit linking proprietary applications with the
+library. If this is what you want to do, use the GNU Library General
+Public License instead of this License.
--- /dev/null
+README.txt for codec2
+David Rowe
+21 August 2009
+
+Introduction
+------------
+
+codec2 is an open source low bit rate speech codec designed for
+communications quality speech at around 2400 bit/s. Applications
+include low bandwidth HF/VHF digital radio.
+
+Status
+------
+
+Unquantised encoder and decoder running under Linux/gcc, pitch
+estimator untested.
+
+Quick Start
+-----------
+
+To encode the file raw/hts1a.raw to a set of sinusoidal model
+parameters (src/hts1.mdl), then decode to a raw file (src/hts1a_uq.raw):
+
+$ cd src
+$ make
+$ ./sinenc ../raw/hts1a.raw hts1.mdl 300 ../pitch/hts1a.p
+$ ./sinedec ../raw/hts1a.raw hts1.mdl -o hts1a_uq.raw
+$ play -f s -r 8000 -s w ../raw/hts1a.raw
+$ play -f s -r 8000 -s w hts1a_uq.raw
+
+Plan
+----
+
+[X] Milestone 0 - Project kick off
+[X] Milestone 1 - Baseline unquantised codec running under Linux/gcc
+[ ] Milestone 2 - Spectral amplitudes quantised
+[ ] Milestone 3 - Prototype 2400 bit/s codec
+
+Directories
+-----------
+
+src - C source code
+octave - Matlab/Octave scripts
+pitch - pitch estimator output files
+raw - speech files in raw format (16 bits signed linear)
+unittest - Unit test source code
+wav - speech files in wave file format
+
+References
+----------
+
+[1] Introductory Blog Post:
+ http://www.rowetel.com/blog/?p=128
+
+[2] Bruce Perens introducing the project:
+ http://codec2.org/
+
+[3] David's thesis, used for baseline algorithm:
+ http://www.itr.unisa.edu.au/~steven/thesis/dgr.pdf
+
--- /dev/null
+TODO for codec2
+---------------
+
+[X] Convert files from DOS to Unix
+[X] Get sinenc and sinedec to build and run under gcc
+[ ] refactor
+ [ ] each source file has its own header
+ [ ] no globals
+ [ ] Consistent file headers
+ [X] GPL2 notice in each file
+[ ] Replace Numerical Recipes in C (NRC) four1.c and four1.h with GNU
+ Scientific Library (GSL) FFT, as NRC code has restrictive licensing
+[ ] change speech files from raw 16 bit files to wave files
\ No newline at end of file
--- /dev/null
+111.627907\r
+97.959183\r
+97.959183\r
+97.959183\r
+87.272736\r
+78.048775\r
+112.280701\r
+120.000008\r
+61.538464\r
+68.817207\r
+84.210526\r
+90.140846\r
+90.140846\r
+90.140846\r
+101.587303\r
+80.000000\r
+72.727272\r
+95.522392\r
+90.140846\r
+90.140846\r
+101.587303\r
+90.140846\r
+85.333336\r
+86.486488\r
+91.428574\r
+91.428574\r
+91.428574\r
+91.428574\r
+91.428574\r
+90.140846\r
+86.486488\r
+86.486488\r
+85.333336\r
+85.333336\r
+85.333336\r
+81.012657\r
+74.418610\r
+71.111115\r
+71.111115\r
+71.111115\r
+71.111115\r
+68.085106\r
+68.085106\r
+67.368423\r
+67.368423\r
+70.329674\r
+70.329674\r
+70.329674\r
+71.111115\r
+74.418610\r
+74.418610\r
+75.294121\r
+79.012352\r
+85.333336\r
+96.969704\r
+111.627907\r
+111.627907\r
+120.000008\r
+111.627907\r
+104.347832\r
+104.347832\r
+97.959183\r
+104.347832\r
+104.347832\r
+104.347832\r
+104.347832\r
+104.347832\r
+104.347832\r
+104.347832\r
+104.347832\r
+97.959183\r
+97.959183\r
+112.280701\r
+112.280701\r
+96.969704\r
+96.969704\r
+96.969704\r
+110.344841\r
+104.347832\r
+97.959183\r
+97.959183\r
+104.347832\r
+97.959183\r
+104.347832\r
+120.000008\r
+104.347832\r
+120.000008\r
+120.000008\r
+97.959183\r
+83.116882\r
+75.294121\r
+71.910118\r
+71.910110\r
+71.910110\r
+71.910110\r
+75.294121\r
+76.190483\r
+80.000008\r
+80.000008\r
+84.210526\r
+85.333336\r
+90.140846\r
+101.587303\r
+108.474571\r
+104.347832\r
+120.000008\r
+120.000008\r
+104.347832\r
+104.347832\r
+71.111115\r
+88.888893\r
+75.294121\r
+111.627907\r
+120.000008\r
+120.000008\r
+97.959183\r
+111.627907\r
+111.627907\r
+111.627907\r
+97.959183\r
+92.307693\r
+92.307693\r
+92.307693\r
+92.307693\r
+120.000008\r
+111.627907\r
+111.627907\r
+86.486488\r
+85.333336\r
+85.333336\r
+90.140846\r
+95.522392\r
+101.587311\r
+101.587311\r
+104.918037\r
+104.347832\r
+104.347832\r
+111.627907\r
+120.000008\r
+97.959183\r
+104.347832\r
+111.627907\r
+88.888893\r
+80.000000\r
+81.012657\r
+85.333336\r
+85.333336\r
+86.486488\r
+91.428574\r
+90.140846\r
+91.428574\r
+96.969704\r
+96.969704\r
+95.522392\r
+95.522392\r
+95.522392\r
+96.969704\r
+96.969704\r
+98.461533\r
+104.918022\r
+97.959183\r
+97.959183\r
+97.959183\r
+104.347832\r
+120.000008\r
+120.000008\r
+92.307693\r
+92.307693\r
+77.108429\r
+79.012344\r
+75.294121\r
+75.294121\r
+76.190483\r
+76.190483\r
+80.000008\r
+81.012657\r
+85.333336\r
+85.333336\r
+85.333336\r
+85.333336\r
+85.333336\r
+90.140846\r
+90.140846\r
+91.428574\r
+96.969704\r
+98.461533\r
+120.000008\r
+120.000008\r
+104.347832\r
+97.959183\r
+97.959183\r
+104.918037\r
+120.000008\r
+120.000008\r
+120.000008\r
+104.347832\r
+92.307693\r
+72.727272\r
+72.727272\r
+76.190483\r
+84.210533\r
+88.888901\r
+120.000008\r
+104.347832\r
+120.000008\r
+120.000008\r
+111.627907\r
+92.307693\r
+97.959183\r
+97.959183\r
+111.627907\r
+120.000008\r
+120.000008\r
+97.959183\r
+97.959183\r
+104.347832\r
+104.347832\r
+104.347832\r
+111.627907\r
+120.000008\r
+97.959183\r
+104.347832\r
+97.959183\r
+97.959183\r
+84.210526\r
+94.117653\r
+96.969704\r
+110.344841\r
+120.000008\r
+97.959183\r
+97.959183\r
+104.347832\r
+97.959183\r
+104.347832\r
+97.959183\r
+97.959183\r
+111.627907\r
+120.000008\r
+92.307693\r
+92.307693\r
+98.461533\r
+98.461533\r
+104.918022\r
+111.627907\r
+111.627907\r
+92.307693\r
+97.959183\r
+92.307693\r
+92.307693\r
+92.307693\r
+92.307693\r
+92.307693\r
+57.657658\r
+90.140846\r
+90.140846\r
+95.522392\r
+101.587311\r
+101.587311\r
+108.474586\r
+111.627907\r
+97.959183\r
+111.627907\r
+120.000008\r
+92.307693\r
+74.418610\r
+74.418610\r
+74.418610\r
+74.418610\r
+76.190483\r
+72.727280\r
+76.190483\r
+76.190483\r
+69.565224\r
+66.666672\r
+54.700855\r
+56.637169\r
+56.637169\r
+71.910110\r
+90.140846\r
+90.140846\r
+72.727272\r
+72.727272\r
+72.727272\r
+72.727272\r
+55.172413\r
+57.142857\r
+55.172413\r
+90.140846\r
+95.522392\r
+101.587311\r
+101.587311\r
+71.910110\r
+74.418610\r
+46.376812\r
+40.000000\r
+95.522392\r
+0\r
+0\r
--- /dev/null
+# Build rules for the codec2 sinusoidal encoder (sinenc) and decoder (sinedec).
+
+CC=gcc
+CFLAGS=-g -Wall
+
+# Object files linked into each executable.
+SINENC_OBJ = sinenc.o globals.o initenc.o four1.o refine.o spec.o
+SINEDEC_OBJ = sinedec.o globals.o initenc.o initdec.o four1.o synth.o
+
+# "all" and "clean" name actions, not files.  Declaring them phony keeps them
+# working even if a file called "all" or "clean" appears in this directory.
+.PHONY: all clean
+
+all: sinenc sinedec
+
+sinenc: $(SINENC_OBJ)
+	$(CC) $(CFLAGS) $(SINENC_OBJ) -o sinenc -lm
+
+sinedec: $(SINEDEC_OBJ)
+	$(CC) $(CFLAGS) $(SINEDEC_OBJ) -o sinedec -lm
+
+%.o : %.c
+	$(CC) -c $(CFLAGS) $< -o $@
+
+# Remove everything the build produces, including the two executables, so
+# that the next "make" starts from a clean tree.
+clean :
+	rm -f sinenc sinedec *.o *~ src/*~
--- /dev/null
+/*---------------------------------------------------------------------------*\
+
+ FILE........: defines.h
+ AUTHOR......: David Rowe
+ DATE CREATED: 23/4/93
+
+ Defines and structures used throughout the codec.
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ Copyright (C) 2009 David Rowe
+
+ All rights reserved.
+
+ This program is free software; you can redistribute it and/or modify
+ it under the terms of the GNU General Public License version 2, as
+ published by the Free Software Foundation. This program is
+ distributed in the hope that it will be useful, but WITHOUT ANY
+ WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
+ License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
+*/
+
+/*---------------------------------------------------------------------------*\
+
+ DEFINES
+
+\*---------------------------------------------------------------------------*/
+
+/* General defines */
+
+#define N 80 /* number of samples per frame */
+#define MAX_AMP 80 /* maximum number of harmonics; sizes the v[], A[] and phi[] arrays in MODEL */
+#define PI 3.141592654 /* pi, rounded to 9 decimal places */
+#define TWO_PI 6.283185307 /* 2*pi, rounded to 9 decimal places */
+#define FC 4000 /* cut-off frequency (presumably in Hz -- TODO confirm) */
+
+/* Pitch estimation defines */
+
+#define M 320 /* pitch analysis frame size (4*N with the values above) */
+#define P_MIN 20 /* minimum pitch (presumably a pitch period in samples -- TODO confirm) */
+#define P_MAX 160 /* maximum pitch (same units as P_MIN) */
+
+/* Encoder defines */
+
+#define AW_ENC 512 /* maximum encoder analysis window size */
+#define FFT_ENC 512 /* size of FFT used for encoder analysis */
+
+/* Decoder defines */
+
+#define AW_DEC 160 /* number of samples in synthesis window (2*N with the values above) */
+#define FFT_DEC 512 /* number of points in DFT */
+#define TW 40 /* Trapezoidal UV synthesis window overlap */
+#define MAX_STR 256 /* NOTE(review): purpose not documented; presumably a maximum string length -- confirm */
+
+/*---------------------------------------------------------------------------*\
+
+ TYPEDEFS
+
+\*---------------------------------------------------------------------------*/
+
+/* Complex number, held as separate single-precision real and imaginary parts */
+
+typedef struct {
+ float real; /* real part */
+ float imag; /* imaginary part */
+} COMP;
+
+
+/* Structure to hold unquantised model parameters for one frame.
+
+   v[], A[] and phi[] are per-harmonic arrays with room for MAX_AMP entries;
+   L says how many harmonics the current frame has.
+   NOTE(review): whether harmonic m lives at index m or m-1 is not visible
+   here -- confirm against the code that fills and reads these arrays. */
+
+typedef struct {
+ float Wo; /* fundamental frequency estimate in radians */
+ int L; /* number of harmonics over the current frame */
+ float v[MAX_AMP]; /* voicing measures */
+ float A[MAX_AMP]; /* average magnitude/unit frequency samples */
+ float phi[MAX_AMP]; /* phase of each harmonic */
+} MODEL;
--- /dev/null
+/*---------------------------------------------------------------------------*\
+
+ FILE........: four1.c
+ AUTHOR......: David Rowe
+ DATE CREATED: 20/2/95
+
+ Numerical Recipes in C FFT function. This code has a restrictive licence,
+ so please replace it.
+
+\*---------------------------------------------------------------------------*/
+
+#include <math.h>
+
+#define SWAP(a,b) tempr=(a);(a)=(b);(b)=tempr /* swaps a and b through the caller's local tempr; expands to three statements, so use it only inside a braced block */
+/*
+  four1() - in-place complex FFT (Numerical Recipes in C routine).
+
+  data  : interleaved complex samples, indexed from 1.  For complex sample
+          k (k = 1..nn) the real part is data[2k-1] and the imaginary part
+          is data[2k].  data[0] is never read or written; the caller must
+          make data[1]..data[2*nn] valid.  The result overwrites the input.
+  nn    : number of complex samples.  Numerical Recipes documents this as
+          required to be a power of two; nothing here checks it.
+  isign : sign applied to the twiddle angle, theta = 2*pi/(isign*mmax).
+          Pass +1 or -1 to select the transform direction; 0 makes theta a
+          division by zero.  No 1/nn scaling is applied for either sign.
+*/
+void four1(data,nn,isign)
+float data[];
+int nn,isign;
+{
+ int n,mmax,m,j,istep,i;
+ double wtemp,wr,wpr,wpi,wi,theta;
+ float tempr,tempi;
+
+ n=nn << 1; /* n = number of floats in use: two per complex sample */
+ j=1;
+ for (i=1;i<n;i+=2) { /* reordering pass: i walks the samples in order, j is its partner index */
+ if (j > i) { /* swap each pair once only */
+ SWAP(data[j],data[i]);
+ SWAP(data[j+1],data[i+1]);
+ }
+ m=n >> 1;
+ while (m >= 2 && j > m) { /* step j to the partner index of the next sample */
+ j -= m;
+ m >>= 1;
+ }
+ j += m;
+ }
+ mmax=2;
+ while (n > mmax) { /* butterfly passes: mmax doubles each pass until it reaches n */
+ istep=2*mmax;
+ theta=6.28318530717959/(isign*mmax); /* angle step for this pass; sign follows isign */
+ wtemp=sin(0.5*theta);
+ wpr = -2.0*wtemp*wtemp; /* equals cos(theta)-1, computed as -2*sin^2(theta/2) */
+ wpi=sin(theta);
+ wr=1.0; /* (wr,wi) starts at 1+0i and is rotated by theta after each m */
+ wi=0.0;
+ for (m=1;m<mmax;m+=2) {
+ for (i=m;i<=n;i+=istep) {
+ j=i+mmax;
+ tempr=wr*data[j]-wi*data[j+1]; /* (tempr,tempi) = (wr,wi) * sample at j */
+ tempi=wr*data[j+1]+wi*data[j];
+ data[j]=data[i]-tempr; /* sample j = sample i - product */
+ data[j+1]=data[i+1]-tempi;
+ data[i] += tempr; /* sample i = sample i + product */
+ data[i+1] += tempi;
+ }
+ wr=(wtemp=wr)*wpr-wi*wpi+wr; /* rotate (wr,wi) by theta; wtemp keeps the old wr for the next line */
+ wi=wi*wpr+wtemp*wpi+wi;
+ }
+ mmax=istep;
+ }
+}
+
+#undef SWAP
--- /dev/null
+/*---------------------------------------------------------------------------*\
+
+ FILE........: four1.h
+ AUTHOR......: David Rowe
+ DATE CREATED: 20/2/95
+
+ Numerical Recipes in C FFT function. This code has a restrictive licence,
+ so please replace it.
+
+\*---------------------------------------------------------------------------*/
+
+#ifndef __FOUR1__ /* NOTE(review): identifiers containing "__" are reserved for the implementation in C */
+#define __FOUR1__
+/*
+  In-place complex FFT, defined in four1.c.
+
+  x     : interleaved real/imaginary samples, indexed from 1; the routine
+          reads and writes x[1]..x[2*n] and never touches x[0].
+  n     : number of complex samples.
+  isign : +1 or -1, selecting the sign of the transform's angle.
+*/
+void four1(float x[], int n, int isign);
+
+#endif /* __FOUR1__ */
+
--- /dev/null
+/*---------------------------------------------------------------------------*\
+
+ FILE........: globals.c
+ AUTHOR......: David Rowe
+ DATE CREATED: 11/5/94
+
+ Globals for sinusoidal speech coder.
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ Copyright (C) 2009 David Rowe
+
+ All rights reserved.
+
+ This program is free software; you can redistribute it and/or modify
+ it under the terms of the GNU General Public License version 2, as
+ published by the Free Software Foundation. This program is
+ distributed in the hope that it will be useful, but WITHOUT ANY
+ WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
+ License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
+*/
+
+#include "sine.h" /* global defines for coder */
+
+/* Globals used in encoder and decoder */
+
+int frames; /* number of frames processed so far */
+float Sn[M+AW_ENC/2]; /* float input speech samples; 576 entries with the values in defines.h */
+MODEL model; /* model parameters for the current frame */
+int Nw; /* number of samples in analysis window */
+float sig; /* energy of current frame */
+
+/* Globals used in encoder */
+
+float w[AW_ENC]; /* time domain hamming window */
+COMP Sw[FFT_ENC]; /* DFT of current frame */
+
+/* Globals used in decoder */
+
+COMP Sw_[FFT_ENC]; /* DFT of all voiced synthesised signal. NOTE(review): sized with FFT_ENC although grouped with the decoder globals; FFT_DEC has the same value in defines.h */
+float Sn_[AW_DEC]; /* synthesised speech */
+float Pn[AW_DEC]; /* time domain Parzen (trapezoidal) window */
+
--- /dev/null
+/*---------------------------------------------------------------------------*\
+
+ FILE........: globals.h
+ AUTHOR......: David Rowe
+ DATE CREATED: 1/11/94
+
+ Globals for sinusoidal speech coder.
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ Copyright (C) 2009 David Rowe
+
+ All rights reserved.
+
+ This program is free software; you can redistribute it and/or modify
+ it under the terms of the GNU General Public License version 2, as
+ published by the Free Software Foundation. This program is
+ distributed in the hope that it will be useful, but WITHOUT ANY
+ WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
+ License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
+*/
+
+/* Globals used in encoder and decoder.
+
+   This header has no include guard and includes nothing itself, so the
+   MODEL and COMP types must already be declared where it is included.
+   The arrays are declared without a size, so sizeof cannot be applied to
+   them through these declarations. */
+
+extern int frames; /* number of frames processed so far */
+extern float Sn[]; /* float input speech samples */
+extern MODEL model; /* model parameters for the current frame */
+extern int Nw; /* number of samples in analysis window */
+extern float sig; /* energy of current frame */
+
+/* Globals used in encoder */
+
+extern float w[]; /* time domain hamming window */
+extern COMP W[]; /* frequency domain hamming window. NOTE(review): globals.c defines no W[] -- confirm it is defined elsewhere before using it */
+extern COMP Sw[]; /* DFT of current frame */
+extern COMP Sw_[]; /* DFT of all voiced synthesised signal (globals.c lists this with the decoder globals) */
+
+/* Globals used in decoder */
+
+extern float Sn_[]; /* output synthesised speech samples */
+extern float Pn[]; /* time domain Parzen (trapezoidal) window */
+
--- /dev/null
+/*---------------------------------------------------------------------------*\
+
+ FILE........: initdec.c
+ AUTHOR......: David Rowe
+ DATE CREATED: 11/5/94
+
+ Initialises sinusoidal speech decoder globals.
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ Copyright (C) 2009 David Rowe
+
+ All rights reserved.
+
+ This program is free software; you can redistribute it and/or modify
+ it under the terms of the GNU General Public License version 2, as
+ published by the Free Software Foundation. This program is
+ distributed in the hope that it will be useful, but WITHOUT ANY
+ WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
+ License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
+*/
+
+#include "sine.h" /* sinusoidal header file */
+
+/*
+ Fills the global synthesis window Pn[] with a trapezoid and clears the
+ global output buffer Sn_[].
+
+ Pn[] layout over indices 0 .. 2*N-1:
+   zero, linear rise of width 2*TW centred on N/2, one,
+   linear fall of width 2*TW centred on 3*N/2, zero.
+*/
+void init_decoder() {
+  const int rise_begin = N/2-TW;
+  const int rise_end = N/2+TW;
+  const int fall_begin = 3*N/2-TW;
+  const int fall_end = 3*N/2+TW;
+  float ramp; /* running value of the sloped sections */
+  int k;
+
+  /* leading zeros */
+
+  for (k = 0; k < rise_begin; k++)
+    Pn[k] = 0.0;
+
+  /* rising edge: starts at 0 and climbs by 1/(2*TW) per sample */
+
+  ramp = 0.0;
+  for (k = rise_begin; k < rise_end; k++) {
+    Pn[k] = ramp;
+    ramp += 1.0/(2*TW);
+  }
+
+  /* flat top */
+
+  for (k = rise_end; k < fall_begin; k++)
+    Pn[k] = 1.0;
+
+  /* falling edge: starts at 1 and drops by 1/(2*TW) per sample */
+
+  ramp = 1.0;
+  for (k = fall_begin; k < fall_end; k++) {
+    Pn[k] = ramp;
+    ramp -= 1.0/(2*TW);
+  }
+
+  /* trailing zeros */
+
+  for (k = fall_end; k < 2*N; k++)
+    Pn[k] = 0.0;
+
+  /* start with a silent output buffer */
+
+  for (k = 0; k < AW_DEC; k++)
+    Sn_[k] = 0.0;
+}
--- /dev/null
+/*---------------------------------------------------------------------------*\
+
+ FILE: initenc.c
+ AUTHOR: David Rowe
+ DATE CREATED: 11/5/94
+
+ Initialises sinusoidal speech encoder.
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ Copyright (C) 2009 David Rowe
+
+ All rights reserved.
+
+ This program is free software; you can redistribute it and/or modify
+ it under the terms of the GNU General Public License version 2, as
+ published by the Free Software Foundation. This program is
+ distributed in the hope that it will be useful, but WITHOUT ANY
+ WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
+ License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
+*/
+
+#include "sine.h" /* sinusoidal header file */
+
+/*
+ Resets the global frame counter and pre-loads the first M+AW_ENC/2
+ entries of the global speech buffer Sn[] with 1.0.
+*/
+void init_encoder()
+{
+  int k = 0;
+
+  frames = 0;
+
+  /* sample buffer memory starts at 1.0, not 0.0 */
+
+  while (k < M+AW_ENC/2) {
+    Sn[k] = 1.0;
+    k++;
+  }
+}
+
+/*
+ Builds the global time domain analysis window w[].
+
+ A raised cosine (0.5 - 0.5*cos) of Nw samples is placed in the middle of
+ the AW_ENC long buffer, with zeros on both sides.  The whole buffer is
+ then scaled by 1/sqrt(E*FFT_ENC), where E is the sum of the squared
+ unscaled window samples.
+
+ Nw       number of non-zero window samples (this parameter hides the
+          global of the same name inside the function)
+ returns  the scale factor that was applied to w[]
+*/
+float make_window(int Nw)
+{
+  const int first = AW_ENC/2-Nw/2; /* index of first non-zero sample */
+  const int last = AW_ENC/2+Nw/2; /* one past the last non-zero sample */
+  float energy; /* sum of squared window samples */
+  float gain; /* normalising scale factor */
+  int n,k;
+
+  /* zeros before the window */
+
+  for (n = 0; n < first; n++)
+    w[n] = 0.0;
+
+  /* raised cosine section, accumulating its energy as we go */
+
+  energy = 0.0;
+  for (n = first, k = 0; n < last; n++, k++) {
+    w[n] = 0.5 - 0.5*cos(TWO_PI*k/(Nw-1));
+    energy += w[n]*w[n];
+  }
+
+  /* zeros after the window */
+
+  for (n = last; n < AW_ENC; n++)
+    w[n] = 0.0;
+
+  /* normalise the complete buffer */
+
+  gain = 1.0/sqrt(energy*FFT_ENC);
+  for (n = 0; n < AW_ENC; n++)
+    w[n] *= gain;
+
+  return gain;
+}
+
--- /dev/null
+/*---------------------------------------------------------------------------*\
+
+ FILE........: nlp.c
+ AUTHOR......: David Rowe
+ DATE CREATED: 23/3/93
+
+ Non Linear Pitch (NLP) estimation functions.
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ Copyright (C) 2009 David Rowe
+
+ All rights reserved.
+
+ This program is free software; you can redistribute it and/or modify
+ it under the terms of the GNU General Public License version 2, as
+ published by the Free Software Foundation. This program is
+ distributed in the hope that it will be useful, but WITHOUT ANY
+ WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
+ License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
+*/
+
+/*---------------------------------------------------------------------------*\
+
+ DEFINES
+
+\*---------------------------------------------------------------------------*/
+
+#define PMAX_M 600 /* maximum NLP analysis window size; length of the sq[] buffer in nlp() */
+#define COEFF 0.95 /* notch filter parameter (feedback gain of the DC notch) */
+#define NTAP 48 /* Decimation LPF order; number of coefficients read from nlp_fir[] */
+#define PE_FFT_SIZE 512 /* DFT size for pitch estimation */
+#define DEC 5 /* decimation factor */
+#define SAMPLE_RATE 8000 /* used to convert a DFT bin to F0 and F0 to a pitch period */
+#define PI 3.141592654 /* mathematical constant */
+#define CNLP 0.5 /* post processor constant: fraction of the global peak a submultiple must exceed */
+
+/*---------------------------------------------------------------------------*\
+
+ GLOBALS
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ 48 tap 600Hz low pass FIR filter coefficients.
+
+ nlp() reads the first NTAP entries of this table, so the table length
+ must stay in step with NTAP.  The coefficients are symmetric about the
+ centre of the table.
+*/
+
+float nlp_fir[] = {
+ -1.0818124e-03,
+ -1.1008344e-03,
+ -9.2768838e-04,
+ -4.2289438e-04,
+ 5.5034190e-04,
+ 2.0029849e-03,
+ 3.7058509e-03,
+ 5.1449415e-03,
+ 5.5924666e-03,
+ 4.3036754e-03,
+ 8.0284511e-04,
+ -4.8204610e-03,
+ -1.1705810e-02,
+ -1.8199275e-02,
+ -2.2065282e-02,
+ -2.0920610e-02,
+ -1.2808831e-02,
+ 3.2204775e-03,
+ 2.6683811e-02,
+ 5.5520624e-02,
+ 8.6305944e-02,
+ 1.1480192e-01,
+ 1.3674206e-01,
+ 1.4867556e-01,
+ 1.4867556e-01,
+ 1.3674206e-01,
+ 1.1480192e-01,
+ 8.6305944e-02,
+ 5.5520624e-02,
+ 2.6683811e-02,
+ 3.2204775e-03,
+ -1.2808831e-02,
+ -2.0920610e-02,
+ -2.2065282e-02,
+ -1.8199275e-02,
+ -1.1705810e-02,
+ -4.8204610e-03,
+ 8.0284511e-04,
+ 4.3036754e-03,
+ 5.5924666e-03,
+ 5.1449415e-03,
+ 3.7058509e-03,
+ 2.0029849e-03,
+ 5.5034190e-04,
+ -4.2289438e-04,
+ -9.2768838e-04,
+ -1.1008344e-03,
+ -1.0818124e-03
+};
+
+/*---------------------------------------------------------------------------*\
+
+ float nlp()
+
+ Estimates the pitch of the current frame using the NLP algorithm:
+
+   1. square the n new speech samples and append them to an internal
+      buffer,
+   2. notch filter the new samples at DC and low pass filter them with
+      nlp_fir[],
+   3. decimate the buffer by DEC, window it and take a PE_FFT_SIZE point
+      DFT,
+   4. pick the largest power spectrum bin between the bins that
+      correspond to pmax and pmin,
+   5. walk the integer submultiples of that bin and prefer a submultiple
+      if it holds a local peak larger than CNLP times the global peak.
+
+ Writes the pitch period in samples to *pitch and returns the fundamental
+ in Hz.
+
+ The squared-sample buffer and both filter memories are static, so the
+ function carries state from one call to the next and is not reentrant.
+
+ If no bin in the search range has positive power (for example an all
+ zero frame) the lowest bin of the search range is reported, instead of
+ an uninitialised value.
+
+\*---------------------------------------------------------------------------*/
+
+float nlp(Sn,n,m,d,pmin,pmax,pitch)
+float Sn[]; /* input speech vector */
+int n; /* frames shift (no. new samples in Sn[]) */
+int m; /* analysis window size */
+int d; /* additional delay (used for testing) */
+int pmin; /* minimum pitch value */
+int pmax; /* maximum pitch value */
+float *pitch; /* estimated pitch */
+{
+  static float sq[PMAX_M]; /* squared speech samples */
+  float notch; /* current notch filter output */
+  static float mem_x,mem_y; /* memory for notch filter */
+  static float mem_fir[NTAP]; /* decimation FIR filter memory */
+  COMP Fw[PE_FFT_SIZE]; /* DFT of squared signal */
+
+  int gmax_bin; /* DFT bin where global maxima occurs */
+  float gmax; /* global maxima value */
+  float lmax; /* current local maxima value */
+  int lmax_bin; /* bin of current local maxima */
+  int cmax_bin; /* bin of chosen local maxima */
+
+  int mult; /* current submultiple */
+  int min_bin; /* lowest possible bin */
+  int bmin,bmax; /* range of local maxima search */
+  float thresh; /* threshold for submultiple selection */
+
+  float F0; /* fundamental frequency */
+  int i,j,b;
+
+  /* Square, notch filter at DC, and LP filter vector */
+
+  for(i=0; i<n; i++) /* square speech samples */
+    sq[i+d+m-n] = Sn[i]*Sn[i];
+
+  for(i=m-n+d; i<m+d; i++) { /* notch filter at DC */
+    notch = sq[i] - mem_x;
+    notch += COEFF*mem_y;
+    mem_x = sq[i];
+    mem_y = notch;
+    sq[i] = notch;
+  }
+
+  for(i=m-n+d; i<m+d; i++) { /* FIR filter vector */
+
+    /* shift the delay line and append the newest sample */
+
+    for(j=0; j<NTAP-1; j++)
+      mem_fir[j] = mem_fir[j+1];
+    mem_fir[NTAP-1] = sq[i];
+
+    sq[i] = 0.0;
+    for(j=0; j<NTAP; j++)
+      sq[i] += mem_fir[j]*nlp_fir[j];
+  }
+
+  /* Decimate and DFT */
+
+  for(i=0; i<PE_FFT_SIZE; i++) {
+    Fw[i].real = 0.0;
+    Fw[i].imag = 0.0;
+  }
+  for(i=0; i<m/DEC; i++)
+    Fw[i].real = sq[i*DEC]*(0.5 - 0.5*cos(2*PI*i/(m/DEC-1)));
+
+  /* The pointer handed to four1() sits one float before Fw[0].real;
+     presumably four1() indexes its data from 1 - confirm in four1.c */
+
+  four1(&Fw[-1].imag,PE_FFT_SIZE,1);
+
+  /* power spectrum, kept in the real part */
+
+  for(i=0; i<PE_FFT_SIZE; i++)
+    Fw[i].real = Fw[i].real*Fw[i].real + Fw[i].imag*Fw[i].imag;
+
+  /* find global peak within limits, this corresponds to F0 estimate */
+
+  min_bin = PE_FFT_SIZE*DEC/pmax;
+  gmax = 0.0;
+  gmax_bin = min_bin; /* defined result when no bin exceeds zero */
+  for(i=min_bin; i<=PE_FFT_SIZE*DEC/pmin; i++) {
+    if (Fw[i].real > gmax) {
+      gmax = Fw[i].real;
+      gmax_bin = i;
+    }
+  }
+
+  /* Now post process estimate by searching submultiples */
+
+  mult = 2;
+  thresh = CNLP*gmax;
+  cmax_bin = gmax_bin;
+
+  while(gmax_bin/mult >= min_bin) {
+
+    b = gmax_bin/mult; /* determine search interval */
+    bmin = 0.8*b;
+    bmax = 1.2*b;
+    if (bmin < min_bin)
+      bmin = min_bin;
+
+    lmax = 0;
+    lmax_bin = bmin;
+    for (b=bmin; b<=bmax; b++) /* look for maximum in interval */
+      if (Fw[b].real > lmax) {
+        lmax = Fw[b].real;
+        lmax_bin = b;
+      }
+
+    /* accept the submultiple only if it is a genuine local peak that
+       clears the threshold */
+
+    if (lmax > thresh)
+      if (lmax > Fw[lmax_bin-1].real && lmax > Fw[lmax_bin+1].real)
+        cmax_bin = lmax_bin;
+
+    mult++;
+  }
+
+  F0 = (float)cmax_bin*SAMPLE_RATE/(PE_FFT_SIZE*DEC);
+  *pitch = SAMPLE_RATE/F0;
+
+  /* Shift samples in buffer to make room for new samples */
+
+  for(i=0; i<m-n+d; i++)
+    sq[i] = sq[i+n];
+
+  return(F0);
+}
+
+
--- /dev/null
+/*---------------------------------------------------------------------------*\
+
+ FILE........: refine.c
+ AUTHOR......: David Rowe
+ DATE CREATED: 27/5/94
+
+ Functions for refining the pitch estimate using the harmonic sum method.
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ Copyright (C) 2009 David Rowe
+
+ All rights reserved.
+
+ This program is free software; you can redistribute it and/or modify
+ it under the terms of the GNU General Public License version 2, as
+ published by the Free Software Foundation. This program is
+ distributed in the hope that it will be useful, but WITHOUT ANY
+ WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
+ License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
+*/
+
+#include "sine.h"
+
+/*---------------------------------------------------------------------------*\
+
+ FUNCTION....: dft_speech
+ AUTHOR......: David Rowe
+ DATE CREATED: 27/5/94
+
+ Finds the DFT of the current input speech frame.
+
+ INPUT.......: global float Sn[] speech samples
+ OUTPUT......: global COMP Sw[] DFT of speech samples
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ Windows the global speech buffer Sn[] with w[] and leaves the DFT of the
+ result in the global Sw[].
+
+ The windowed samples are written to the real part of Sw[] rotated by
+ half a window: the second half of the window goes to the start of the
+ FFT buffer and the first half to its end.  Everything else is zero.
+*/
+void dft_speech()
+{
+  const int half = AW_ENC/2; /* half the analysis window length */
+  const int tail = FFT_ENC-AW_ENC/2; /* first FFT bin of the wrapped half */
+  int k;
+
+  /* clear the whole FFT buffer */
+
+  for (k = 0; k < FFT_ENC; k++) {
+    Sw[k].real = 0.0;
+    Sw[k].imag = 0.0;
+  }
+
+  /* second half of the window -> start of the FFT buffer */
+
+  for (k = 0; k < half; k++)
+    Sw[k].real = Sn[k+half]*w[k+half];
+
+  /* first half of the window -> end of the FFT buffer */
+
+  for (k = 0; tail+k < FFT_ENC; k++)
+    Sw[tail+k].real = Sn[k]*w[k];
+
+  /* same call convention as the original: pointer one float before
+     Sw[0].real, FFT_ENC points, direction flag -1 */
+
+  four1(&Sw[-1].imag,FFT_ENC,-1);
+}
+
+/*---------------------------------------------------------------------------*\
+
+ FUNCTION....: two_stage_pitch_refinement
+ AUTHOR......: David Rowe
+ DATE CREATED: 27/5/94
+
+ Refines the current pitch estimate using the harmonic sum pitch
+ estimation technique.
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ Refines model.Wo with two passes of hs_pitch_refinement(): a coarse pass
+ over +/-5 around the current pitch period in steps of 1, then a fine
+ pass over +/-1 around the updated period in steps of 0.25.  The result
+ is clamped to [TWO_PI/P_MAX, TWO_PI/P_MIN] and model.L is recomputed
+ from it.
+*/
+void two_stage_pitch_refinement()
+{
+  /* search half-width and step of the coarse and the fine pass */
+  static const float half_width[2] = { 5, 1 };
+  static const float step[2] = { 1.0, 0.25 };
+  float lo,hi; /* pitch period search limits of the current pass */
+  int pass;
+
+  /* each pass is centred on the model.Wo left by the previous one */
+
+  for (pass = 0; pass < 2; pass++) {
+    hi = TWO_PI/model.Wo + half_width[pass];
+    lo = TWO_PI/model.Wo - half_width[pass];
+    hs_pitch_refinement(lo,hi,step[pass]);
+  }
+
+  /* keep the fundamental inside the supported pitch range */
+
+  if (model.Wo < TWO_PI/P_MAX)
+    model.Wo = TWO_PI/P_MAX;
+  if (model.Wo > TWO_PI/P_MIN)
+    model.Wo = TWO_PI/P_MIN;
+
+  model.L = floor(PI/model.Wo);
+}
+
+/*---------------------------------------------------------------------------*\
+
+ FUNCTION....: hs_pitch_refinement
+ AUTHOR......: David Rowe
+ DATE CREATED: 27/5/94
+
+ Harmonic sum pitch refinement function.
+
+ pmin pitch search range minimum
+ pmax pitch search range maximum
+ step pitch search step size
+ model current pitch estimate in model.Wo
+
+ model refined pitch estimate in model.Wo
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ Searches pitch periods pmin, pmin+pstep, ... up to pmax and stores in
+ model.Wo the fundamental whose harmonics collect the most energy from
+ the global spectrum Sw[].
+
+ model.L is set from the incoming model.Wo and that same harmonic count
+ is used for every candidate.
+
+ If no candidate has energy above zero (for example an all zero
+ spectrum), model.Wo keeps its incoming value.  A step that is not
+ positive would never terminate the search, so it is rejected and
+ model.Wo is left untouched.
+*/
+void hs_pitch_refinement(float pmin, float pmax, float pstep)
+{
+  int m; /* loop variable */
+  int b; /* bin for current harmonic centre */
+  float E; /* energy for current pitch */
+  float Wo; /* current "test" fundamental freq. */
+  float Wom; /* Wo that maximises E */
+  float Em; /* maximum energy */
+  float r; /* number of rads/bin */
+  float p; /* current pitch */
+
+  /* Initialisation */
+
+  model.L = PI/model.Wo; /* use initial pitch est. for L */
+  Wom = model.Wo; /* result when no candidate beats zero energy */
+  Em = 0.0;
+  r = TWO_PI/FFT_ENC;
+
+  if (pstep <= 0.0)
+    return;
+
+  /* Determine harmonic sum for a range of Wo values */
+
+  for(p=pmin; p<=pmax; p+=pstep) {
+    E = 0.0;
+    Wo = TWO_PI/p;
+
+    /* Sum harmonic magnitudes */
+
+    for(m=1; m<=model.L; m++) {
+      b = floor(m*Wo/r + 0.5); /* nearest DFT bin to harmonic m */
+      E += Sw[b].real*Sw[b].real + Sw[b].imag*Sw[b].imag;
+    }
+
+    /* Compare to see if this is a maximum */
+
+    if (E > Em) {
+      Em = E;
+      Wom = Wo;
+    }
+  }
+
+  model.Wo = Wom;
+}
+
--- /dev/null
+/*---------------------------------------------------------------------------*\
+
+ FILE........: sine.h
+ AUTHOR......: David Rowe
+ DATE CREATED: 1/11/94
+
+ Header file for Sinusoidal coder.
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ Copyright (C) 2009 David Rowe
+
+ All rights reserved.
+
+ This program is free software; you can redistribute it and/or modify
+ it under the terms of the GNU General Public License version 2, as
+ published by the Free Software Foundation. This program is
+ distributed in the hope that it will be useful, but WITHOUT ANY
+ WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
+ License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
+*/
+
+/*---------------------------------------------------------------------------*\
+
+ INCLUDES
+
+\*---------------------------------------------------------------------------*/
+
+#include <stdlib.h>
+#include <stdio.h>
+#include <math.h>
+
+#include "defines.h" /* defines for sinusoidal coder */
+#include "globals.h" /* external globals */
+
+/*---------------------------------------------------------------------------*\
+
+ FUNCTIONS
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ Several declarations below use empty parentheses, which leaves the
+ parameter list unspecified: the compiler does not check the arguments
+ at the call sites of those functions.
+*/
+
+/* functions in refine.c */
+
+void dft_speech(); /* DFT of windowed Sn[] into Sw[] */
+void two_stage_pitch_refinement(); /* coarse then fine refinement of model.Wo */
+void hs_pitch_refinement(float pmin, float pmax, float pstep); /* harmonic sum search over pitch periods pmin..pmax */
+
+/* functions in spec.c */
+
+void estimate_amplitudes(); /* fills model.A[] and model.phi[] from Sw[] */
+void estimate_voicing();
+void estimate_voicing_av();
+float voicing(int lower, int upper);
+
+/* functions in four1.c */
+
+void four1(); /* called as four1(&X[-1].imag, size, +1 or -1) on COMP arrays */
+
+/* functions in synth.c */
+
+void synthesise_mixed(); /* called as synthesise_mixed(Pn, &model, Sn_) */
+
+/* functions in initenc.c and initdec.c */
+
+void init_encoder(void);
+float make_window(); /* called as make_window(Nw); takes one int */
+void init_decoder();
+
+/* functions in gasdev.c */
+
+float gasdev();
+
--- /dev/null
+/*---------------------------------------------------------------------------*\
+
+ FILE........: sinedec.c
+ AUTHOR......: David Rowe
+ DATE CREATED: 20/2/95
+
+ Decoder program for sinusoidal codec.
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ Copyright (C) 2009 David Rowe
+
+ All rights reserved.
+
+ This program is free software; you can redistribute it and/or modify
+ it under the terms of the GNU General Public License version 2, as
+ published by the Free Software Foundation. This program is
+ distributed in the hope that it will be useful, but WITHOUT ANY
+ WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
+ License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
+*/
+
+#include <string.h>
+#include "sine.h"
+
+/*---------------------------------------------------------------------------*\
+
+ switch_present()
+
+ Searches the command line arguments for a "switch". If the switch is
+ found, returns the index of the command line argument where it was found,
+ else returns 0.
+
+\*---------------------------------------------------------------------------*/
+
+int switch_present(sw,argc,argv)
+register char sw[]; /* switch in string form */
+register int argc; /* number of command line arguments */
+register char *argv[]; /* array of command line arguments in string form */
+{
+  register int pos = 1; /* argv[0] is never examined */
+
+  /* the first exact match wins; 0 means the switch is absent */
+
+  while (pos < argc) {
+    if (strcmp(sw,argv[pos]) == 0)
+      return pos;
+    pos++;
+  }
+
+  return 0;
+}
+
+/*---------------------------------------------------------------------------*\
+
+ MAIN
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ sinedec InputFile ModelFile [-o OutputFile] [-l Frames]
+
+ Reads one MODEL record per frame from ModelFile and N input speech
+ samples per frame from InputFile.  When -o is given, each frame is
+ synthesised with synthesise_mixed() and N clipped 16 bit samples are
+ written to OutputFile.
+
+ Returns 0 on success.  Exits with status 1 if a file cannot be opened or
+ a switch is missing its value or has a bad one, and with status 0 after
+ printing the usage message.
+*/
+int main(int argc, char *argv[])
+{
+  FILE *fmodel; /* file of model parameters from encoder */
+  FILE *fout; /* output speech file */
+  FILE *fin; /* input speech file */
+  short buf[N]; /* input/output buffer */
+  int i; /* loop variable */
+  int length; /* frame count given with -l */
+  int arg; /* argv index of the switch being parsed */
+  int nread; /* input samples actually read for this frame */
+
+  if (argc < 3) {
+    printf("usage: sinedec InputFile ModelFile [-o OutputFile]\n");
+    exit(0);
+  }
+
+  /* Interpret command line arguments -------------------------------------*/
+
+  /* Input file */
+
+  if ((fin = fopen(argv[1],"rb")) == NULL) {
+    printf("Error opening input speech file: %s\n",argv[1]);
+    exit(1);
+  }
+
+  /* Model parameter file */
+
+  if ((fmodel = fopen(argv[2],"rb")) == NULL) {
+    printf("Error opening model file: %s\n",argv[2]);
+    exit(1);
+  }
+
+  /* Output file */
+
+  if ((arg = switch_present("-o",argc,argv))) {
+
+    /* a trailing -o has no file name after it; argv[argc] is NULL */
+
+    if (arg+1 >= argc) {
+      printf("Error: -o requires an output file name\n");
+      exit(1);
+    }
+    if ((fout = fopen(argv[arg+1],"wb")) == NULL) {
+      printf("Error opening output speech file: %s\n",argv[arg+1]);
+      exit(1);
+    }
+  }
+  else
+    fout = NULL;
+
+  /* Length (no. of frames) */
+
+  /* NOTE(review): the value is validated here but the main loop does not
+     use it to limit the number of frames - confirm whether it should */
+
+  if ((arg = switch_present("-l",argc,argv))) {
+    if (arg+1 >= argc) {
+      printf("Error: -l requires a frame count\n");
+      exit(1);
+    }
+    length = atoi(argv[arg+1]);
+    if (length < 0) {
+      printf("Error in length: %d\n",length);
+      exit(1);
+    }
+  }
+  else
+    length = 32000;
+
+  /* Initialise ------------------------------------------------------------*/
+
+  init_decoder();
+  init_encoder();
+  Nw = 220;
+  make_window(Nw);
+
+  /* Main loop ------------------------------------------------------------*/
+
+  frames = 0;
+  while(fread(&model,sizeof(model),1,fmodel) /*&& frames < 1200*/) {
+    frames++;
+
+    /* Read input speech; buf[] also carries the previous frame's output,
+       so a short read is padded with silence instead of reusing it */
+
+    nread = (int)fread(buf,sizeof(short),N,fin);
+    for(i=nread; i<N; i++)
+      buf[i] = 0;
+
+    for(i=0; i<N+AW_ENC/2; i++)
+      Sn[i] = Sn[i+N];
+    for(i=0; i<N; i++)
+      Sn[i+N+AW_ENC/2] = buf[i];
+
+    /* Synthesise speech */
+
+    if (fout != NULL) {
+
+      synthesise_mixed(Pn,&model,Sn_);
+
+      /* Save output speech to disk, clipped to +/-32767 */
+
+      for(i=0; i<N; i++) {
+        if (Sn_[i] > 32767.0)
+          buf[i] = 32767;
+        else if (Sn_[i] < -32767.0)
+          buf[i] = -32767;
+        else
+          buf[i] = Sn_[i];
+      }
+      fwrite(buf,sizeof(short),N,fout);
+    }
+
+  }
+
+  /* close files and exit */
+
+  if (fout != NULL)
+    fclose(fout);
+  fclose(fin);
+  fclose(fmodel);
+
+  return 0;
+}
+
--- /dev/null
+/*---------------------------------------------------------------------------*\
+
+ FILE........: sinenc.c
+ AUTHOR......: David Rowe
+ DATE CREATED: 20/2/95
+
+ Sinusoidal speech encoder program using external (Matlab) pitch estimator.
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ Copyright (C) 2009 David Rowe
+
+ All rights reserved.
+
+ This program is free software; you can redistribute it and/or modify
+ it under the terms of the GNU General Public License version 2, as
+ published by the Free Software Foundation. This program is
+ distributed in the hope that it will be useful, but WITHOUT ANY
+ WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
+ License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
+*/
+
+#include "sine.h"
+
+/*---------------------------------------------------------------------------*\
+
+ MAIN
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ sinenc InputFile ModelFile Frames PitchFile [RefinedPitchFile]
+
+ Reads N samples per frame from InputFile, takes one pitch estimate per
+ frame from the text file PitchFile (from the third frame onwards),
+ refines it, estimates the harmonic amplitudes and phases and appends the
+ resulting MODEL record to ModelFile.  If a fifth argument is given, the
+ refined model.Wo of every frame after the second is written to it as
+ text.
+
+ Processing stops at the first incomplete frame or once Frames frames
+ have been processed.  If PitchFile runs out or holds unreadable text,
+ P_MIN is used as the pitch for that frame.
+
+ Returns 0 on success; exits with status 1 on a usage or file error.
+*/
+int main(int argc, char *argv[])
+{
+  FILE *fin; /* input speech sample file */
+  FILE *fmodel; /* output file of model parameters */
+  FILE *fp; /* input text file containing pitch estimates */
+  short buf[N]; /* input speech sample buffer */
+  int length; /* number of frames to process */
+  float pitch; /* current pitch estimate from external pitch file */
+  int i; /* loop variable */
+  FILE *fref; /* optional output file with refined pitch estimate */
+
+  if (argc < 5) {
+    printf("usage: sinenc InputFile ModelFile Frames PitchFile\n");
+    exit(1);
+  }
+
+  /* Interpret command line arguments -------------------------------------*/
+
+  if ((fin = fopen(argv[1],"rb")) == NULL) {
+    printf("Error opening input file: %s\n",argv[1]);
+    exit(1);
+  }
+
+  if ((fmodel = fopen(argv[2],"wb")) == NULL) {
+    printf("Error opening output model file: %s\n",argv[2]);
+    exit(1);
+  }
+
+  length = atoi(argv[3]);
+
+  if ((fp = fopen(argv[4],"rt")) == NULL) {
+    printf("Error opening input pitch file: %s\n",argv[4]);
+    exit(1);
+  }
+
+  if (argc > 5) {
+    if ((fref = fopen(argv[5],"wt")) == NULL) {
+      printf("Error opening output pitch refinement file: %s\n",argv[5]);
+      exit(1);
+    }
+  }
+  else
+    fref = NULL;
+
+  init_encoder(); /* also resets the global frame counter */
+  Nw = 220;
+  make_window(Nw);
+
+  /* Main loop ------------------------------------------------------------*/
+
+  while(fread(buf,sizeof(short),N,fin) == N && frames != length) {
+    frames++;
+
+    /* Update input speech buffers */
+
+    for(i=0; i<N+AW_ENC/2; i++)
+      Sn[i] = Sn[i+N];
+    for(i=0; i<N; i++)
+      Sn[i+N+AW_ENC/2] = buf[i];
+
+    /* Estimate pitch */
+
+    if (frames > 2) {
+
+      /* a failed read would leave pitch unset, so fall back to P_MIN */
+
+      if (fscanf(fp,"%f\n",&pitch) != 1)
+        pitch = P_MIN;
+      if (pitch > P_MAX) pitch = P_MAX;
+      if (pitch < P_MIN) pitch = P_MIN;
+    }
+    else
+      pitch = P_MIN;
+
+    /* construct analysis window */
+
+    model.Wo = TWO_PI/pitch;
+
+    /* estimate and model parameters */
+
+    dft_speech();
+    two_stage_pitch_refinement();
+    estimate_amplitudes();
+
+    /* save model parameters */
+
+    if (fref != NULL && frames > 2)
+      fprintf(fref,"%f\n",model.Wo);
+    fwrite(&model,sizeof(model),1,fmodel);
+    printf("frame: %d\r",frames);
+  }
+
+  /* close files and exit */
+
+  if (fref != NULL) fclose(fref);
+  fclose(fp);
+  fclose(fin);
+  fclose(fmodel);
+
+  return 0;
+}
+
--- /dev/null
+/*---------------------------------------------------------------------------*\
+
+ FILE........: spec.c
+ AUTHOR......: David Rowe
+ DATE CREATED: 27/5/94
+
+ Functions for estimating the complex amplitude of harmonics.
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ Copyright (C) 2009 David Rowe
+
+ All rights reserved.
+
+ This program is free software; you can redistribute it and/or modify
+ it under the terms of the GNU General Public License version 2, as
+ published by the Free Software Foundation. This program is
+ distributed in the hope that it will be useful, but WITHOUT ANY
+ WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
+ License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
+*/
+
+#include "sine.h"
+
+/*---------------------------------------------------------------------------*\
+
+ FUNCTION....: estimate_amplitudes
+ AUTHOR......: David Rowe
+ DATE CREATED: 27/5/94
+
+ Estimates the complex amplitudes of the harmonics. Also generates
+ all voiced synthetic spectrum for later voicing estimation.
+
+ INPUT.......: global float Sw[] DFT of speech
+ global MODEL model contains parameters L and Wo
+
+ OUTPUT......: global float Sw_[] DFT of all voiced synthesised speech
+ global MODEL model contains parameters A[] and phi[]
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ For every harmonic 1..model.L of model.Wo:
+
+   model.A[]    square root of the energy summed over the DFT bins from
+                half a harmonic below the harmonic centre up to (but not
+                including) half a harmonic above it
+   model.phi[]  phase of the DFT bin nearest the harmonic centre
+
+ Reads the global spectrum Sw[].  Only model.A[] and model.phi[] are
+ written; Sw_[] is not touched by this function.
+*/
+void estimate_amplitudes()
+{
+  const float rads_per_bin = TWO_PI/FFT_ENC; /* number of rads/bin */
+  float energy; /* energy summed across the current harmonic */
+  int first,end; /* bounds of current harmonic, end is exclusive */
+  int centre; /* DFT bin of centre of current harmonic */
+  int harm,k; /* loop variables */
+
+  for (harm = 1; harm <= model.L; harm++) {
+
+    /* nearest bins to the band edges and to the harmonic centre */
+
+    first = floor((harm - 0.5)*model.Wo/rads_per_bin + 0.5);
+    end = floor((harm + 0.5)*model.Wo/rads_per_bin + 0.5);
+    centre = floor(harm*model.Wo/rads_per_bin + 0.5);
+
+    /* amplitude from the band energy */
+
+    energy = 0.0;
+    k = first;
+    while (k < end) {
+      energy += Sw[k].real*Sw[k].real + Sw[k].imag*Sw[k].imag;
+      k++;
+    }
+    model.A[harm] = sqrt(energy);
+
+    /* phase from the centre bin */
+
+    model.phi[harm] = atan2(Sw[centre].imag,Sw[centre].real);
+  }
+}
+
--- /dev/null
+/*---------------------------------------------------------------------------*\
+
+ FILE........: synth.c
+ AUTHOR......: David Rowe
+ DATE CREATED: 20/2/95
+
+ Function for synthesising a speech signal in the frequency domain from
+ the sinusoidal model parameters.
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ Copyright (C) 2009 David Rowe
+
+ All rights reserved.
+
+ This program is free software; you can redistribute it and/or modify
+ it under the terms of the GNU General Public License version 2, as
+ published by the Free Software Foundation. This program is
+ distributed in the hope that it will be useful, but WITHOUT ANY
+ WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
+ License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
+*/
+
+#include "sine.h"
+
+/*
+ Synthesises one frame from the harmonic model and overlap-adds it into
+ Sn_[].
+
+ Sn_[] is first shifted left by N samples.  A FFT_DEC point spectrum is
+ then built with one line per harmonic (plus its conjugate mirror line),
+ transformed with four1(), windowed with Pn[] and combined with Sn_[]:
+ the last N-1 transform outputs are added to Sn_[0..N-2], and the
+ following outputs, starting at output 0, overwrite Sn_[N-1..2N-1].
+*/
+void synthesise_mixed(Pn,model,Sn_)
+float Pn[]; /* time domain Parzen window */
+MODEL *model; /* ptr to model parameters for this frame */
+float Sn_[]; /* time domain synthesised signal */
+{
+  COMP spec[FFT_DEC]; /* DFT of synthesised signal */
+  int n,k; /* sample and bin loop variables */
+  int harm; /* current harmonic */
+  int bin; /* DFT bin nearest the current harmonic */
+
+  /* Update memories: drop the oldest N samples */
+
+  n = 0;
+  while (n < N-1) {
+    Sn_[n] = Sn_[n+N];
+    n++;
+  }
+  Sn_[N-1] = 0.0;
+
+  /* Start from an empty spectrum */
+
+  for (k = 0; k < FFT_DEC; k++) {
+    spec[k].real = 0.0;
+    spec[k].imag = 0.0;
+  }
+
+  /* One spectral line per harmonic, mirrored as its complex conjugate
+     (the mirror copies the values just stored in the line itself) */
+
+  for (harm = 1; harm <= model->L; harm++) {
+    bin = floor(harm*model->Wo*FFT_DEC/TWO_PI + 0.5);
+    spec[bin].real = model->A[harm]*cos(model->phi[harm]);
+    spec[bin].imag = model->A[harm]*sin(model->phi[harm]);
+    spec[FFT_DEC-bin].real = spec[bin].real;
+    spec[FFT_DEC-bin].imag = -spec[bin].imag;
+  }
+
+  /* Perform inverse DFT */
+
+  four1(&spec[-1].imag,FFT_DEC,1);
+
+  /* Overlap add the end of the transform output to the previous samples */
+
+  for (n = 0; n < N-1; n++) {
+    Sn_[n] += spec[FFT_DEC-N+1+n].real*Pn[n];
+  }
+
+  /* The start of the transform output becomes the new tail of Sn_[] */
+
+  for (k = 0; N-1+k < 2*N; k++)
+    Sn_[N-1+k] = spec[k].real*Pn[N-1+k];
+}
+
--- /dev/null
+/*---------------------------------------------------------------------------*\
+
+ FILE........: tnlp.c
+ AUTHOR......: David Rowe
+ DATE CREATED: 23/3/93
+
+ Test program for non linear pitch estimation functions.
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ Copyright (C) 2009 David Rowe
+
+ All rights reserved.
+
+ This program is free software; you can redistribute it and/or modify
+ it under the terms of the GNU General Public License version 2, as
+ published by the Free Software Foundation. This program is
+ distributed in the hope that it will be useful, but WITHOUT ANY
+ WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
+ License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
+*/
+
+#define N 160 /* frame size */
+#define M 320 /* pitch analysis window size */
+#define PITCH_MIN 20 /* passed to nlpl() as the minimum pitch value */
+#define PITCH_MAX 133 /* passed to nlpl() as the maximum pitch value */
+/* NOTE(review): TNLP is not referenced in this file; presumably one of the .c files included below tests it - confirm */
+#define TNLP
+
+/* number of frames read so far; defined before the .c files below are included */
+int frames;
+
+#include <stdlib.h>
+#include <stdio.h>
+#include <math.h>
+#include "four1.c"
+#include "nlpl.c"
+
+/*---------------------------------------------------------------------------*\
+
+ FUNCTIONS
+
+\*---------------------------------------------------------------------------*/
+
+/* Exchanges the low and high byte of each of the first n samples of buf[], in place. */
+void swap(buf,n)
+short buf[]; /* array of speech samples */
+int n; /* number of speech samples */
+{
+  short low,high; /* the two bytes of the current sample */
+  int k = 0;
+
+  while (k < n) {
+    low = buf[k] & 0xff;
+    high = (buf[k] >> 8) & 0xff;
+
+    /* old low byte moves up, old high byte moves down */
+
+    buf[k] = (low << 8) | high;
+    k++;
+  }
+}
+
+/* Copies the first n samples of b[] into s[], converting each one to float. */
+void short_to_float(b,s,n)
+short b[]; /* buffer of short speech samples */
+float s[]; /* buffer of float speech samples */
+int n; /* number of speech samples */
+{
+  int k = 0;
+
+  while (k < n) {
+    s[k] = (float)b[k];
+    k++;
+  }
+}
+
+/*---------------------------------------------------------------------------*\
+
+ MAIN
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ tnlp InputFile OutputFile
+
+ Reads InputFile in frames of N 16 bit samples, runs nlpl() on each frame
+ and writes the pitch estimates to the text file OutputFile, one per
+ line.  The estimates of the first two frames are not written; two "0"
+ lines are appended after the last frame instead.
+
+ A final frame shorter than N samples is padded with zeros.
+
+ Returns 0 on success and 1 after printing the usage message; exits with
+ status 1 if a file cannot be opened.
+*/
+int main(int argc, char *argv[])
+{
+  FILE *fin,*fout;
+  short buf[N]; /* input speech samples */
+  float Sn[N]; /* the same samples as floats */
+  float pitch; /* pitch estimate written by nlpl() */
+  int pbin; /* passed to nlpl() by address and kept between frames */
+  int nread; /* samples actually read for this frame */
+  int k;
+
+  if (argc != 3) {
+    printf("\nusage: tnlp InputFile OutputFile\n");
+    return 1;
+  }
+
+  /* Input file */
+
+  if ((fin = fopen(argv[1],"rb")) == NULL) {
+    printf("Error opening input speech file: %s\n",argv[1]);
+    exit(1);
+  }
+
+  /* Output file */
+
+  if ((fout = fopen(argv[2],"wt")) == NULL) {
+    printf("Error opening output text file: %s\n",argv[2]);
+    exit(1);
+  }
+
+  frames = 0;
+  pbin = 102;
+  while((nread = (int)fread(buf,sizeof(short),N,fin)) > 0) {
+    frames++;
+
+    /* pad a short final frame with silence rather than reusing the tail
+       of the previous frame */
+
+    for(k=nread; k<N; k++)
+      buf[k] = 0;
+
+    short_to_float(buf,Sn,N);
+    nlpl(Sn,N,M,N-NTAP/2,PITCH_MIN,PITCH_MAX,&pitch,&pbin);
+
+    /* Compensate for delay in C version compared to Matlab */
+
+    if (frames > 2)
+      fprintf(fout,"%f\n",pitch);
+
+    printf("frame: %d pitch: %f\n",frames,pitch);
+
+  }
+  fprintf(fout,"0\n0\n");
+
+  fclose(fin);
+  fclose(fout);
+
+  return 0;
+}
+
+