Daniel@0: /***********************************************************************/ Daniel@0: /* */ Daniel@0: /* svm_learn.h */ Daniel@0: /* */ Daniel@0: /* Declarations for learning module of Support Vector Machine. */ Daniel@0: /* */ Daniel@0: /* Author: Thorsten Joachims */ Daniel@0: /* Date: 02.07.02 */ Daniel@0: /* */ Daniel@0: /* Copyright (c) 2002 Thorsten Joachims - All rights reserved */ Daniel@0: /* */ Daniel@0: /* This software is available for non-commercial use only. It must */ Daniel@0: /* not be modified and distributed without prior permission of the */ Daniel@0: /* author. The author is not responsible for implications from the */ Daniel@0: /* use of this software. */ Daniel@0: /* */ Daniel@0: /***********************************************************************/ Daniel@0: Daniel@0: #ifndef SVM_LEARN Daniel@0: #define SVM_LEARN Daniel@0: Daniel@0: void svm_learn_classification(DOC **, double *, long, long, LEARN_PARM *, Daniel@0: KERNEL_PARM *, KERNEL_CACHE *, MODEL *, Daniel@0: double *); Daniel@0: void svm_learn_regression(DOC **, double *, long, long, LEARN_PARM *, Daniel@0: KERNEL_PARM *, KERNEL_CACHE **, MODEL *); Daniel@0: void svm_learn_ranking(DOC **, double *, long, long, LEARN_PARM *, Daniel@0: KERNEL_PARM *, KERNEL_CACHE **, MODEL *); Daniel@0: void svm_learn_optimization(DOC **, double *, long, long, LEARN_PARM *, Daniel@0: KERNEL_PARM *, KERNEL_CACHE *, MODEL *, Daniel@0: double *); Daniel@0: long optimize_to_convergence(DOC **, long *, long, long, LEARN_PARM *, Daniel@0: KERNEL_PARM *, KERNEL_CACHE *, SHRINK_STATE *, Daniel@0: MODEL *, long *, long *, double *, Daniel@0: double *, double *, Daniel@0: TIMING *, double *, long, long); Daniel@0: long optimize_to_convergence_sharedslack(DOC **, long *, long, long, Daniel@0: LEARN_PARM *, Daniel@0: KERNEL_PARM *, KERNEL_CACHE *, SHRINK_STATE *, Daniel@0: MODEL *, double *, double *, double *, Daniel@0: TIMING *, double *); Daniel@0: double compute_objective_function(double *, double *, double *, double, Daniel@0: long *, long *); Daniel@0: void clear_index(long *); Daniel@0: void add_to_index(long *, long); Daniel@0: long compute_index(long *,long, long *); Daniel@0: void optimize_svm(DOC **, long *, long *, long *, double, long *, long *, Daniel@0: MODEL *, Daniel@0: long, long *, long, double *, double *, double *, Daniel@0: LEARN_PARM *, CFLOAT *, KERNEL_PARM *, QP *, double *); Daniel@0: void compute_matrices_for_optimization(DOC **, long *, long *, long *, double, Daniel@0: long *, Daniel@0: long *, long *, MODEL *, double *, Daniel@0: double *, double *, long, long, LEARN_PARM *, Daniel@0: CFLOAT *, KERNEL_PARM *, QP *); Daniel@0: long calculate_svm_model(DOC **, long *, long *, double *, double *, Daniel@0: double *, double *, LEARN_PARM *, long *, Daniel@0: long *, MODEL *); Daniel@0: long check_optimality(MODEL *, long *, long *, double *, double *, Daniel@0: double *, long, Daniel@0: LEARN_PARM *,double *, double, long *, long *, long *, Daniel@0: long *, long, KERNEL_PARM *); Daniel@0: long check_optimality_sharedslack(DOC **docs, MODEL *model, long int *label, Daniel@0: double *a, double *lin, double *c, double *slack, Daniel@0: double *alphaslack, long int totdoc, Daniel@0: LEARN_PARM *learn_parm, double *maxdiff, Daniel@0: double epsilon_crit_org, long int *misclassified, Daniel@0: long int *active2dnum, Daniel@0: long int *last_suboptimal_at, Daniel@0: long int iteration, KERNEL_PARM *kernel_parm); Daniel@0: void compute_shared_slacks(DOC **docs, long int *label, double *a, Daniel@0: double *lin, double *c, long int *active2dnum, Daniel@0: LEARN_PARM *learn_parm, Daniel@0: double *slack, double *alphaslack); Daniel@0: long identify_inconsistent(double *, long *, long *, long, LEARN_PARM *, Daniel@0: long *, long *); Daniel@0: long identify_misclassified(double *, long *, long *, long, Daniel@0: MODEL *, long *, long *); Daniel@0: long identify_one_misclassified(double *, long *, long *, long, Daniel@0: MODEL *, long *, long *); Daniel@0: long incorporate_unlabeled_examples(MODEL *, long *,long *, long *, Daniel@0: double *, double *, long, double *, Daniel@0: long *, long *, long, KERNEL_PARM *, Daniel@0: LEARN_PARM *); Daniel@0: void update_linear_component(DOC **, long *, long *, double *, double *, Daniel@0: long *, long, long, KERNEL_PARM *, Daniel@0: KERNEL_CACHE *, double *, Daniel@0: CFLOAT *, double *); Daniel@0: long select_next_qp_subproblem_grad(long *, long *, double *, Daniel@0: double *, double *, long, Daniel@0: long, LEARN_PARM *, long *, long *, Daniel@0: long *, double *, long *, KERNEL_CACHE *, Daniel@0: long, long *, long *); Daniel@0: long select_next_qp_subproblem_rand(long *, long *, double *, Daniel@0: double *, double *, long, Daniel@0: long, LEARN_PARM *, long *, long *, Daniel@0: long *, double *, long *, KERNEL_CACHE *, Daniel@0: long *, long *, long); Daniel@0: long select_next_qp_slackset(DOC **docs, long int *label, double *a, Daniel@0: double *lin, double *slack, double *alphaslack, Daniel@0: double *c, LEARN_PARM *learn_parm, Daniel@0: long int *active2dnum, double *maxviol); Daniel@0: void select_top_n(double *, long, long *, long); Daniel@0: void init_shrink_state(SHRINK_STATE *, long, long); Daniel@0: void shrink_state_cleanup(SHRINK_STATE *); Daniel@0: long shrink_problem(DOC **, LEARN_PARM *, SHRINK_STATE *, KERNEL_PARM *, Daniel@0: long *, long *, long, long, long, double *, long *); Daniel@0: void reactivate_inactive_examples(long *, long *, double *, SHRINK_STATE *, Daniel@0: double *, double*, long, long, long, LEARN_PARM *, Daniel@0: long *, DOC **, KERNEL_PARM *, Daniel@0: KERNEL_CACHE *, MODEL *, CFLOAT *, Daniel@0: double *, double *); Daniel@0: Daniel@0: /* cache kernel evalutations to improve speed */ Daniel@0: KERNEL_CACHE *kernel_cache_init(long, long); Daniel@0: void kernel_cache_cleanup(KERNEL_CACHE *); Daniel@0: void get_kernel_row(KERNEL_CACHE *,DOC **, long, long, long *, CFLOAT *, Daniel@0: KERNEL_PARM *); Daniel@0: void cache_kernel_row(KERNEL_CACHE *,DOC **, long, KERNEL_PARM *); Daniel@0: void cache_multiple_kernel_rows(KERNEL_CACHE *,DOC **, long *, long, Daniel@0: KERNEL_PARM *); Daniel@0: void kernel_cache_shrink(KERNEL_CACHE *,long, long, long *); Daniel@0: void kernel_cache_reset_lru(KERNEL_CACHE *); Daniel@0: long kernel_cache_malloc(KERNEL_CACHE *); Daniel@0: void kernel_cache_free(KERNEL_CACHE *,long); Daniel@0: long kernel_cache_free_lru(KERNEL_CACHE *); Daniel@0: CFLOAT *kernel_cache_clean_and_malloc(KERNEL_CACHE *,long); Daniel@0: long kernel_cache_touch(KERNEL_CACHE *,long); Daniel@0: long kernel_cache_check(KERNEL_CACHE *,long); Daniel@0: long kernel_cache_space_available(KERNEL_CACHE *); Daniel@0: Daniel@0: void compute_xa_estimates(MODEL *, long *, long *, long, DOC **, Daniel@0: double *, double *, KERNEL_PARM *, Daniel@0: LEARN_PARM *, double *, double *, double *); Daniel@0: double xa_estimate_error(MODEL *, long *, long *, long, DOC **, Daniel@0: double *, double *, KERNEL_PARM *, Daniel@0: LEARN_PARM *); Daniel@0: double xa_estimate_recall(MODEL *, long *, long *, long, DOC **, Daniel@0: double *, double *, KERNEL_PARM *, Daniel@0: LEARN_PARM *); Daniel@0: double xa_estimate_precision(MODEL *, long *, long *, long, DOC **, Daniel@0: double *, double *, KERNEL_PARM *, Daniel@0: LEARN_PARM *); Daniel@0: void avg_similarity_of_sv_of_one_class(MODEL *, DOC **, double *, long *, KERNEL_PARM *, double *, double *); Daniel@0: double most_similar_sv_of_same_class(MODEL *, DOC **, double *, long, long *, KERNEL_PARM *, LEARN_PARM *); Daniel@0: double distribute_alpha_t_greedily(long *, long, DOC **, double *, long, long *, KERNEL_PARM *, LEARN_PARM *, double); Daniel@0: double distribute_alpha_t_greedily_noindex(MODEL *, DOC **, double *, long, long *, KERNEL_PARM *, LEARN_PARM *, double); Daniel@0: void estimate_transduction_quality(MODEL *, long *, long *, long, DOC **, double *); Daniel@0: double estimate_margin_vcdim(MODEL *, double, double, KERNEL_PARM *); Daniel@0: double estimate_sphere(MODEL *, KERNEL_PARM *); Daniel@0: double estimate_r_delta_average(DOC **, long, KERNEL_PARM *); Daniel@0: double estimate_r_delta(DOC **, long, KERNEL_PARM *); Daniel@0: double length_of_longest_document_vector(DOC **, long, KERNEL_PARM *); Daniel@0: Daniel@0: void write_model(char *, MODEL *); Daniel@0: void write_prediction(char *, MODEL *, double *, double *, long *, long *, Daniel@0: long, LEARN_PARM *); Daniel@0: void write_alphas(char *, double *, long *, long); Daniel@0: Daniel@0: typedef struct cache_parm_s { Daniel@0: KERNEL_CACHE *kernel_cache; Daniel@0: CFLOAT *cache; Daniel@0: DOC **docs; Daniel@0: long m; Daniel@0: KERNEL_PARM *kernel_parm; Daniel@0: long offset,stepsize; Daniel@0: } cache_parm_t; Daniel@0: Daniel@0: #endif