Beispiel #1
0
        public static Example exampleFromString(string data, DataSetSpecification dataSetSpec, string separator)
        {
            IRegularExpression        splitter        = TextFactory.CreateRegularExpression(separator);
            IMap <string, IAttribute> attributes      = CollectionFactory.CreateInsertionOrderedMap <string, IAttribute>();
            ICollection <string>      attributeValues = CollectionFactory.CreateQueue <string>(splitter.Split(data));

            if (dataSetSpec.isValid(attributeValues))
            {
                ICollection <string> names = dataSetSpec.getAttributeNames();
                int min = names.Size() > attributes.Size() ? names.Size() : attributes.Size();

                for (int i = 0; i < min; ++i)
                {
                    string name = names.Get(i);
                    IAttributeSpecification attributeSpec = dataSetSpec.getAttributeSpecFor(name);
                    IAttribute attribute = attributeSpec.CreateAttribute(attributeValues.Get(i));
                    attributes.Put(name, attribute);
                }
                string targetAttributeName = dataSetSpec.getTarget();
                return(new Example(attributes, attributes.Get(targetAttributeName)));
            }
            else
            {
                throw new RuntimeException("Unable to construct Example from " + data);
            }
        }
Beispiel #2
0
        public DataSet fromFile(string filename, DataSetSpecification spec, string separator)
        {
            // assumed file in data directory and ends in .csv
            DataSet ds = new DataSet(spec);

            if (!System.IO.File.Exists(filename + ".csv"))
            {
                throw new FileNotFoundException(filename + ".csv" + " does not exist.");
            }
            using (System.IO.StreamReader reader = new System.IO.StreamReader(filename + ".csv"))
            {
                string line = string.Empty;

                while (!reader.EndOfStream)
                {
                    line = reader.ReadLine().Trim();
                    if (!string.IsNullOrEmpty(line))
                    {
                        ds.add(exampleFromString(line, spec, separator));
                    }
                }
            }

            return(ds);
        }
Beispiel #3
0
        public static DataSetSpecification createIrisDataSetSpec()
        {
            DataSetSpecification dss = new DataSetSpecification();

            dss.defineNumericAttribute("sepal_length");
            dss.defineNumericAttribute("sepal_width");
            dss.defineNumericAttribute("petal_length");
            dss.defineNumericAttribute("petal_width");
            dss.defineStringAttribute("plant_category", new string[] { "setosa", "versicolor", "virginica" });
            return(dss);
        }
Beispiel #4
0
        public static DataSetSpecification createAnimalDataSetSpec()
        {
            DataSetSpecification dss = new DataSetSpecification();

            for (int i = 1; i <= 20; ++i)
            {
                dss.defineNumericAttribute(string.Format("feature_{0}", i));
            }
            dss.defineStringAttribute("animal_name", new string[] { "GIRAFFE", "HIPPO", "LION" });
            return(dss);
        }
Beispiel #5
0
        public static DataSetSpecification createCSVDataSetSpec()
        {
            DataSetSpecification dss = new DataSetSpecification();

            for (int i = 0; i < 13; ++i)
            {
                dss.defineNumericAttribute(i.ToString());
            }

            return(dss);
        }
Beispiel #6
0
        public static DataSetSpecification createRestaurantDataSetSpec()
        {
            DataSetSpecification dss = new DataSetSpecification();

            dss.defineStringAttribute("alternate", Util.YesNo());
            dss.defineStringAttribute("bar", Util.YesNo());
            dss.defineStringAttribute("fri/sat", Util.YesNo());
            dss.defineStringAttribute("hungry", Util.YesNo());
            dss.defineStringAttribute("patrons", new string[] { "None", "Some", "Full" });
            dss.defineStringAttribute("price", new string[] { "$", "$$", "$$$" });
            dss.defineStringAttribute("raining", Util.YesNo());
            dss.defineStringAttribute("reservation", Util.YesNo());
            dss.defineStringAttribute("type", new string[] { "French", "Italian", "Thai", "Burger" });
            dss.defineStringAttribute("wait_estimate", new string[] { "0-10", "10-30", "30-60", ">60" });
            dss.defineStringAttribute("will_wait", Util.YesNo());
            // last attribute is the target attribute unless the target is explicitly reset with dss.setTarget(name)

            return(dss);
        }
Beispiel #7
0
 /// <summary>
 /// The specification to set.
 /// USE SPARINGLY for testing etc .. makes no semantic sense
 /// </summary>
 /// <param name="specification"></param>
 public void setSpecification(DataSetSpecification specification)
 {
     this.specification = specification;
 }
Beispiel #8
0
 public DataSet(DataSetSpecification spec)
 {
     examples           = CollectionFactory.CreateQueue <Example>();
     this.specification = spec;
 }
Beispiel #9
0
        public static DataSet getAnimalDataSet()
        {
            DataSetSpecification spec = createAnimalDataSetSpec();

            return(new DataSetFactory().fromFile("animal-test", spec, ","));
        }
Beispiel #10
0
        public static DataSet getIrisDataSet()
        {
            DataSetSpecification spec = createIrisDataSetSpec();

            return(new DataSetFactory().fromFile("iris", spec, ","));
        }
Beispiel #11
0
        public static DataSet getRestaurantDataSet()
        {
            DataSetSpecification spec = createRestaurantDataSetSpec();

            return(new DataSetFactory().fromFile("restaurant", spec, "\\s+"));
        }