···11+opam-version: "2.0"
22+maintainer: "unixjunkie@sdf.org"
33+authors: ["Francois Berenger"]
44+homepage: "https://github.com/UnixJunkie/oranger"
55+bug-reports: "https://github.com/UnixJunkie/oranger/issues"
66+dev-repo: "git+https://github.com/UnixJunkie/oranger.git"
77+license: "LGPL-2.1-only WITH OCaml-LGPL-linking-exception"
88+build: [
99+ ["dune" "build" "-p" name "-j" jobs]
1010+ ["tar" "xzf" "0.9.11.tar.gz"]
1111+ ["mkdir" "ranger-0.9.11/cpp_version/build"]
1212+ ["sh" "-c" "cd ranger-0.9.11/cpp_version/build && %{conf-cmake:cmd}% ../"]
1313+ [make "-C" "ranger-0.9.11/cpp_version/build"]
1414+]
1515+install: [
1616+ ["cp" "ranger-0.9.11/cpp_version/build/ranger" "%{bin}%/ml_rf_ranger"]
1717+]
1818+depends: [
1919+ "dune" {>= "1.0.0"}
2020+ "conf-cmake" {build}
2121+ "re" {>= "1.9.0"}
2222+ "dolog" {>= "6.0.0"}
2323+ "batteries" {>= "3.3.0"}
2424+ "minicli" {>= "5.0.2"}
2525+ "cpm" {>= "12.0.0"}
2626+ "line_oriented" {>= "1.0.0"}
2727+ "molenc" {>= "16.0.0"}
2828+ "parany" {>= "12.0.3"}
2929+]
3030+depopts: [
3131+ "conf-gnuplot"
3232+]
3333+synopsis: "OCaml wrapper for the ranger (C++) random forests implementation"
3434+description: """
3535+Ranger is run from the command line and data are exchanged via text files.
3636+This is quick and dirty, not a clean OCaml interface to ranger.
3737+The oranger_rfr program lets you train and test a random-forests regressor model.
3838+
3939+$ oranger_rfr
4040+usage:
4141+oranger_rfr [-p <float>]: proportion of the (randomized) dataset
4242+ used to train (default=0.80)
4343+ [-np <int>]: max number of processes (default=1)
4444+ [-n <int>]: |RF|, the number of trees in the forest (default=100)
4545+ [--mtry <float>]: proportion of randomly selected features
4646+ to use at each split (default=(sqrt(|features|))/|features|)
4747+ [--scan-mtry]: scan for best mtry in [0.001,0.002,0.005,...,1.0]
4848+ (incompatible with --mtry)
4949+ [--mtry-range <string>]: mtrys to test e.g. "0.001,0.002,0.005"
5050+ [-o <filename>]: output scores to file
5151+ [--train <train.txt>]: training set (overrides -p)
5252+ [--valid <valid.txt>]: validation set (overrides -p)
5353+ [--test <test.txt>]: test set (overrides -p)
5454+ [--NxCV <int>]: number of folds of cross validation
5555+ [--seed <int>]: fix random seed
5656+ [--no-regr-plot]: turn OFF regression plot
5757+ [--rec-plot]: turn ON REC curve
5858+ [--y-rand]: turn ON Y-randomization
5959+ [-s <filename>]: save model to file
6060+ [-l <filename>]: load model from file
6161+ [--max-feat <int>]: max feature id. (cf. end of encoding dict)
6262+ [-v]: verbose/debug mode
6363+ [-h|--help]: show this help message
6464+"""
6565+extra-source "0.9.11.tar.gz" {
6666+ src: "https://github.com/imbs-hl/ranger/archive/0.9.11.tar.gz"
6767+ checksum: "md5=cf770dfdde5ef250bfd561ef2b0758ee"
6868+}
6969+url {
7070+ src: "https://github.com/UnixJunkie/oranger/archive/v4.3.3.tar.gz"
7171+ checksum: "md5=0c6b40873ca79cd656f323a009050fa2"
7272+}