commit e0171a799fbb4458db77a10f76a6279727aac521 · anil.recoil.org/opam-repository

+86
packages/linwrap/linwrap.9.1.5/opam
···

       1
       1
       +
       opam-version: "2.0"

     

       2
       2
       +
       authors: "Francois Berenger"

     

       3
       3
       +
       maintainer: "unixjunkie@sdf.org"

     

       4
       4
       +
       homepage: "https://github.com/UnixJunkie/linwrap"

     

       5
       5
       +
       bug-reports: "https://github.com/UnixJunkie/linwrap/issues"

     

       6
       6
       +
       dev-repo: "git+https://github.com/UnixJunkie/linwrap.git"

     

       7
       7
       +
       license: "BSD-3-Clause"

     

       8
       8
       +
       build: ["dune" "build" "-p" name "-j" jobs]

     

       9
       9
       +
       install: ["cp" "bin/ecfp6.py" "%{bin}%/linwrap_ecfp6.py"]

     

       10
       10
       +
       depends: [

     

       11
       11
       +
         "base-unix"

     

       12
       12
       +
         "batteries" {>= "3.3.0"}

     

       13
       13
       +
         "bst"

     

       14
       14
       +
         "conf-liblinear-tools"

     

       15
       15
       +
         "cpm" {>= "11.0.0"}

     

       16
       16
       +
         "dokeysto" # possible perf. regr.: dokeysto_camltc -> dokeysto

     

       17
       17
       +
         "ocaml" {>= "5.0.0"} # because camltc not yet ready for ocaml>=5.0.0

     

       18
       18
       +
         "dolog" {>= "6.0.0"}

     

       19
       19
       +
         "dune" {>= "1.10"}

     

       20
       20
       +
         "minicli" {>= "5.0.0"}

     

       21
       21
       +
         "molenc"

     

       22
       22
       +
         "parany" {>= "11.0.0"}

     

       23
       23
       +
       ]

     

       24
       24
       +
       # the software can compile and install without the depopts.

     

       25
       25
       +
       # however, some tools and options will not work anymore at run-time  

     

       26
       26
       +
       depopts: [

     

       27
       27
       +
         "conf-gnuplot"

     

       28
       28
       +
         "conf-python-3"

     

       29
       29
       +
         "conf-rdkit"

     

       30
       30
       +
       ]

     

       31
       31
       +
       synopsis: "Wrapper on top of liblinear-tools"

     

       32
       32
       +
       description: """

     

       33
       33
       +
       Linwrap can be used to train a L2-regularized logistic regression classifier

     

       34
       34
       +
       or a linear Support Vector Regressor.

     

       35
       35
       +
       You can optimize C (the L2 regularization parameter), w (the class weight)

     

       36
       36
       +
       or k (the number of bags, i.e. use bagging).

     

       37
       37
       +
       You can also find the optimal classification threshold using MCC maximization,

     

       38
       38
       +
       use k-folds cross validation, parallelization, etc.

     

       39
       39
       +
       In the regression case, you can only optimize C and epsilon.

     

       40
       40
       +
       

     

       41
       41
       +
       When using bagging, each model is trained on balanced bootstraps

     

       42
       42
       +
       from the training set (one bootstrap for the positive class,

     

       43
       43
       +
       one for the negative class).

     

       44
       44
       +
       The size of the bootstrap is the size of the smallest (under-represented)

     

       45
       45
       +
       class.

     

       46
       46
       +
       

     

       47
       47
       +
       usage: linwrap

     

       48
       48
       +
         -i <filename>: training set or DB to screen

     

       49
       49
       +
         [-o <filename>]: predictions output file

     

       50
       50
       +
         [-np <int>]: ncores

     

       51
       51
       +
         [-c <float>]: fix C

     

       52
       52
       +
         [-e <float>]: fix epsilon (for SVR);

     

       53
       53
       +
         (0 <= epsilon <= max_i(|y_i|))

     

       54
       54
       +
         [-w <float>]: fix w1

     

       55
       55
       +
         [--no-plot]: no gnuplot

     

       56
       56
       +
         [-k <int>]: number of bags for bagging (default=off)

     

       57
       57
       +
         [{-n|--NxCV} <int>]: folds of cross validation

     

       58
       58
       +
         [--mcc-scan]: MCC scan for a trained model (requires n>1)

     

       59
       59
       +
         also requires (c, w, k) to be known

     

       60
       60
       +
         [--seed <int>]: fix random seed

     

       61
       61
       +
         [-p <float>]: training set portion (in [0.0:1.0])

     

       62
       62
       +
         [--pairs]: read from .AP files (atom pairs; will offset feat. indexes by 1)

     

       63
       63
       +
         [--train <train.liblin>]: training set (overrides -p)

     

       64
       64
       +
         [--valid <valid.liblin>]: validation set (overrides -p)

     

       65
       65
       +
         [--test <test.liblin>]: test set (overrides -p)

     

       66
       66
       +
         [{-l|--load} <filename>]: prod. mode; use trained models

     

       67
       67
       +
         [{-s|--save} <filename>]: train. mode; save trained models

     

       68
       68
       +
         [-f]: force overwriting existing model file

     

       69
       69
       +
         [--scan-c]: scan for best C

     

       70
       70
       +
         [--scan-e <int>]: epsilon scan #steps for SVR

     

       71
       71
       +
         [--regr]: regression (SVR); also, implied by -e and --scan-e

     

       72
       72
       +
         [--scan-w]: scan weight to counter class imbalance

     

       73
       73
       +
         [--w-range <float>:<int>:<float>]: specific range for w

     

       74
       74
       +
         (semantic=start:nsteps:stop)

     

       75
       75
       +
         [--e-range <float>:<int>:<float>]: specific range for e

     

       76
       76
       +
         (semantic=start:nsteps:stop)

     

       77
       77
       +
         [--c-range <float,float,...>] explicit scan range for C 

     

       78
       78
       +
         (example='0.01,0.02,0.03')

     

       79
       79
       +
         [--k-range <int,int,...>] explicit scan range for k 

     

       80
       80
       +
         (example='1,2,3,5,10')

     

       81
       81
       +
         [--scan-k]: scan number of bags (advice: optim. k rather than w)

     

       82
       82
       +
       """

     

       83
       83
       +
       url {

     

       84
       84
       +
         src: "https://github.com/UnixJunkie/linwrap/archive/v9.1.5.tar.gz"

     

       85
       85
       +
         checksum: "md5=f59e8b0452a5bb33f0fe239e524b5b40"

     

       86
       86
       +
       }