00001
#ifndef _PROTEOME_H_
00002
#define _PROTEOME_H_
00003
00004
extern char* PROTEIN_DATABASE_PATH ;
00005
extern const char* PROTEIN_DATABASE_FOLDER ;
00006
extern const char* PROTEIN_DATABASE_INDEX_FILE ;
00007
00008
extern char* PROTEIN_LIST_PATH ;
00009
extern const char* PROTEIN_LIST_FOLDER ;
00010
extern const char* PROTEIN_LIST_EXT ;
00011
00012
extern char* PEPTIDE_PATH;
00013
extern const char* PEPTIDE_FOLDER;
00014
extern const char* PEPTIDE_EXT;
00015
00016
#include "peptide_tk.h"
00017
00018
#define MAX_SIZE_PROTEIN_LIST 7000
00019
#define MAX_PROT_LENGTH 5000
00020
#define MAX_NO_REC_SITES 600
00021
00022
00023
enum
00024 {
00025 SPEPTIDE_MW
00026 };
00027
00028
enum
00029 {
00030 PROTEOLYSIS_ALL_POSSIBLE,
00031 PROTEOLYSIS_COMPLETE
00032 };
00033
00034
typedef struct
00035
{
00036
int* GI;
00037
char** filename;
00038 } ProteomeIndex;
00039
00040
typedef struct
00041
{
00042
int* GI;
00043
char** filename;
00044 } ProteinDatabaseIndex;
00045
00046
typedef struct
00047
{
00048
unsigned flag: 1;
00049
float mw;
00050
int length;
00051
char* name;
00052
char* truncated_name;
00053
char* sequence;
00054 } LProtein;
00055
00056
#include "speptide.h"
00057
00058
00059
00060
#define NO_PROTEASES 5
00061
#define MAX_PROTEASE_LENGTH 128
00062
00063
00064
00065
extern long SKIP;
00066
extern long LCO;
00067
00068
00069
typedef enum { PROTEASE_NONE,
00070 PROTEASE_TRYPSIN,
00071 PROTEASE_TRYPSIN_CHYMOTRYPSIN,
00072 PROTEASE_CHYMOTRYPSIN,
00073 PROTEASE_PEPTIDE_LIBRARY
00074 } Enzyme;
00075
00076
extern Enzyme PROTEASE;
00077
00078
int Protease_stringToIndex(
char* string);
00079
char* Protease_indexToString(
int index);
00080
int Protease_set(
int enzyme);
00081
int isRecSite(
char c);
00082
00083
00084
char* loadProtein(
char* szProteinName,
char* szFileformat);
00085
void fillLProteinArrayAtIndexFromFastaFile(LProtein* proteinLibrary,
int* index,
char* fastafilename);
00086
00087
int LProteinArray_loadLibrary(LProtein** proteinLibrary,
int* nSizeProteinLibrary,
char* szProteinListName);
00088
char* LProtein_createRestrictionSitesArray(LProtein* prot);
00089
void LProteinArray_fprint(FILE* fp, LProtein* proteinLibrary,
int size);
00090
00091
void fprintLProteinLibraryNames(FILE* fp, LProtein* proteinLibrary,
int size);
00092 LProtein** extractRibosomalProteins(FILE* fp, LProtein* proteinLibrary,
int size,
int* setsize);
00093
void extractProteinsWithName(FILE* fp, LProtein* proteinLibrary,
int size,
char* name);
00094
void printProteinSubset(LProtein*** subset);
00095
00096
00097
int loadProteomeIndex(ProteomeIndex* PROT_INDEX,
long* nProteomeSize);
00098
int loadProteinDatabaseIndex(ProteinDatabaseIndex* PDBI,
long* nProteinDatabaseSize);
00099
long calculateSizePeptideLibrary(
char* szProteomeSubsetName);
00100
00101
00102
long calculateNumberOfRecSites(
char protein[]);
00103
00104
long calculateNumberOfPeptides(
char pep[],
int options);
00105
00106
00107
void initializePeptideLibrary (PeptideLibrary* library);
00108
void fprintPeptideLibrary (FILE* fp, PeptideLibrary library);
00109
long SPeptideArray_calculateSize (
char protein[],
int skipped_sites);
00110
00111
typedef struct
00112
{
00113
char* restriction_site_array;
00114
char* boundaries_site_array;
00115
char** peptide_mark_array;
00116 LProtein* protein;
00117
int lines;
00118
int rem;
00119
int nrows_per_line;
00120
int nAminoAcidsPerLine;
00121 } ProteinCoverDisplay;
00122
00123
void ProteinCoverDisplay_fprint(FILE* pOut, ProteinCoverDisplay* pcd);
00124 Range2i* ProteinCoverDisplay_createBoundaryArray(ProteinCoverDisplay* pcd,
int* nsize);
00125
int ProteinCoverDisplay_calcCoverage(ProteinCoverDisplay* pcd);
00126
float* LProtein_getAminoAcidIonCountArray(LProtein* protein,
00127
char* ion_file,
int row_start,
int seq_col,
int abu_col,
int* nPeptides);
00128
00129
#define CHAR_PER_MARK 10
00130
00131
extern ProteomeIndex CURR_PROT_INDEX;
00132
extern LProtein* CURR_LProteinLibrary;
00133
extern SPeptide* CURR_SPeptideLibrary;
00134
extern long nSizePepLibrary;
00135
extern int nSizeProteinLibrary;
00136
00137
#include "proteome/rpeptide.h"
00138
#include "proteome/fastafile.h"
00139
#include "proteome/proteincoverdisplay.h"
00140
00141
#endif
00142