Item talk:Q66357

From geokb

{

 "USGS Publications Warehouse": {
   "schema": {
     "@context": "https://schema.org",
     "@type": "CreativeWork",
     "additionalType": "USGS Numbered Series",
     "name": "Cost-Benefit Analysis of Computer Resources for Machine Learning",
     "identifier": [
       {
         "@type": "PropertyValue",
         "propertyID": "USGS Publications Warehouse IndexID",
         "value": "ofr20071398",
         "url": "https://pubs.usgs.gov/publication/ofr20071398"
       },
       {
         "@type": "PropertyValue",
         "propertyID": "USGS Publications Warehouse Internal ID",
         "value": 80800
       },
       {
         "@type": "PropertyValue",
         "propertyID": "DOI",
         "value": "10.3133/ofr20071398",
         "url": "https://doi.org/10.3133/ofr20071398"
       }
     ],
     "inLanguage": "en",
     "isPartOf": [
       {
         "@type": "CreativeWorkSeries",
         "name": "Open-File Report"
       }
     ],
     "datePublished": "2007",
     "dateModified": "2012-02-02",
     "abstract": "Machine learning describes pattern-recognition algorithms - in this case, probabilistic neural networks (PNNs). These can be computationally intensive, in part because of the nonlinear optimizer, a numerical process that calibrates the PNN by minimizing a sum of squared errors. This report suggests efficiencies that are expressed as cost and benefit. The cost is computer time needed to calibrate the PNN, and the benefit is goodness-of-fit, how well the PNN learns the pattern in the data. There may be a point of diminishing returns where a further expenditure of computer resources does not produce additional benefits. Sampling is suggested as a cost-reduction strategy. One consideration is how many points to select for calibration and another is the geometric distribution of the points. The data points may be nonuniformly distributed across space, so that sampling at some locations provides additional benefit while sampling at other locations does not. A stratified sampling strategy can be designed to select more points in regions where they reduce the calibration error and fewer points in regions where they do not. Goodness-of-fit tests ensure that the sampling does not introduce bias. This approach is illustrated by statistical experiments for computing correlations between measures of roadless area and population density for the San Francisco Bay Area. The alternative to training efficiencies is to rely on high-performance computer systems. These may require specialized programming and algorithms that are optimized for parallel performance.",
     "description": "iv, 7 p.",
     "publisher": {
       "@type": "Organization",
       "name": "Geological Survey (U.S.)"
     },
     "author": [
       {
         "@type": "Person",
         "name": "Champion, Richard A. rchampio@usgs.gov",
         "givenName": "Richard A.",
         "familyName": "Champion",
         "email": "rchampio@usgs.gov"
       }
     ],
     "funder": [
       {
         "@type": "Organization",
         "name": "Western Geographic Science Center",
         "url": "https://www.usgs.gov/centers/western-geographic-science-center"
       }
     ]
   }
 },
 "OpenAlex": {
   "abstract_inverted_index": {
     "Machine": [
       0
     ],
     "learning": [
       1
     ],
     "describes": [
       2
     ],
     "pattern-recognition": [
       3
     ],
     "algorithms": [
       4,
       226
     ],
     "-": [
       5
     ],
     "in": [
       6,
       18,
       72,
       157,
       168
     ],
     "this": [
       7
     ],
     "case,": [
       8
     ],
     "probabilistic": [
       9
     ],
     "neural": [
       10
     ],
     "networks": [
       11
     ],
     "(PNNs).": [
       12
     ],
     "These": [
       13,
       220
     ],
     "can": [
       14,
       150
     ],
     "be": [
       15,
       77,
       125,
       151
     ],
     "computationally": [
       16
     ],
     "intensive,": [
       17
     ],
     "part": [
       19
     ],
     "because": [
       20
     ],
     "of": [
       21,
       36,
       80,
       87,
       118,
       196
     ],
     "the": [
       22,
       30,
       58,
       61,
       67,
       70,
       73,
       115,
       119,
       162,
       178,
       203
     ],
     "nonlinear": [
       23
     ],
     "optimizer,": [
       24
     ],
     "a": [
       25,
       34,
       78,
       84,
       99
     ],
     "numerical": [
       26
     ],
     "process": [
       27
     ],
     "that": [
       28,
       43,
       131,
       177,
       227
     ],
     "calibrates": [
       29
     ],
     "PNN": [
       31,
       68
     ],
     "by": [
       32,
       188
     ],
     "minimizing": [
       33
     ],
     "sum": [
       35
     ],
     "squared": [
       37
     ],
     "errors.": [
       38
     ],
     "This": [
       39,
       184
     ],
     "report": [
       40
     ],
     "suggests": [
       41
     ],
     "efficiencies": [
       42,
       212
     ],
     "are": [
       44,
       228
     ],
     "expressed": [
       45
     ],
     "as": [
       46,
       98
     ],
     "cost": [
       47,
       51
     ],
     "and": [
       48,
       60,
       112,
       165,
       199,
       225
     ],
     "benefit.": [
       49
     ],
     "The": [
       50,
       121,
       208
     ],
     "is": [
       52,
       63,
       96,
       104,
       114,
       186,
       213
     ],
     "computer": [
       53,
       88,
       218
     ],
     "time": [
       54
     ],
     "needed": [
       55
     ],
     "to": [
       56,
       108,
       153,
       210,
       214
     ],
     "calibrate": [
       57
     ],
     "PNN,": [
       59
     ],
     "benefit": [
       62,
       138
     ],
     "goodness-of-fit,": [
       64
     ],
     "how": [
       65,
       105
     ],
     "well": [
       66
     ],
     "learns": [
       69
     ],
     "pattern": [
       71
     ],
     "data.": [
       74
     ],
     "There": [
       75
     ],
     "may": [
       76,
       124,
       221
     ],
     "point": [
       79
     ],
     "diminishing": [
       81
     ],
     "returns": [
       82
     ],
     "where": [
       83,
       159,
       170
     ],
     "further": [
       85
     ],
     "expenditure": [
       86
     ],
     "resources": [
       89
     ],
     "does": [
       90,
       144,
       180
     ],
     "not": [
       91,
       181
     ],
     "produce": [
       92
     ],
     "additional": [
       93,
       137
     ],
     "benefits.": [
       94
     ],
     "Sampling": [
       95
     ],
     "suggested": [
       97
     ],
     "cost-reduction": [
       100
     ],
     "strategy.": [
       101
     ],
     "One": [
       102
     ],
     "consideration": [
       103
     ],
     "many": [
       106
     ],
     "points": [
       107,
       123,
       156,
       167
     ],
     "select": [
       109,
       154
     ],
     "for": [
       110,
       191,
       202,
       230
     ],
     "calibration": [
       111,
       163
     ],
     "another": [
       113
     ],
     "geometric": [
       116
     ],
     "distribution": [
       117
     ],
     "points.": [
       120
     ],
     "data": [
       122
     ],
     "nonuniformly": [
       126
     ],
     "distributed": [
       127
     ],
     "across": [
       128
     ],
     "space,": [
       129
     ],
     "so": [
       130
     ],
     "sampling": [
       132,
       140,
       148,
       179
     ],
     "at": [
       133,
       141
     ],
     "some": [
       134
     ],
     "locations": [
       135,
       143
     ],
     "provides": [
       136
     ],
     "while": [
       139
     ],
     "other": [
       142
     ],
     "not.": [
       145,
       173
     ],
     "A": [
       146
     ],
     "stratified": [
       147
     ],
     "strategy": [
       149
     ],
     "designed": [
       152
     ],
     "more": [
       155
     ],
     "regions": [
       158,
       169
     ],
     "they": [
       160,
       171
     ],
     "reduce": [
       161
     ],
     "error": [
       164
     ],
     "fewer": [
       166
     ],
     "do": [
       172
     ],
     "Goodness-of-fit": [
       174
     ],
     "tests": [
       175
     ],
     "ensure": [
       176
     ],
     "introduce": [
       182
     ],
     "bias.": [
       183
     ],
     "approach": [
       185
     ],
     "illustrated": [
       187
     ],
     "statistical": [
       189
     ],
     "experiments": [
       190
     ],
     "computing": [
       192
     ],
     "correlations": [
       193
     ],
     "between": [
       194
     ],
     "measures": [
       195
     ],
     "roadless": [
       197
     ],
     "area": [
       198
     ],
     "population": [
       200
     ],
     "density": [
       201
     ],
     "San": [
       204
     ],
     "Francisco": [
       205
     ],
     "Bay": [
       206
     ],
     "Area.": [
       207
     ],
     "alternative": [
       209
     ],
     "training": [
       211
     ],
     "rely": [
       215
     ],
     "on": [
       216
     ],
     "high-performance": [
       217
     ],
     "systems.": [
       219
     ],
     "require": [
       222
     ],
     "specialized": [
       223
     ],
     "programming": [
       224
     ],
     "optimized": [
       229
     ],
     "parallel": [
       231
     ],
     "performance.": [
       232
     ]
   },
   "apc_list": null,
   "apc_paid": null,
   "authorships": [
     {
       "author_position": "first",
       "author": {
         "id": "https://openalex.org/A5088522093",
         "display_name": "Richard A. Champion",
         "orcid": null
       },
       "institutions": [],
       "countries": [],
       "is_corresponding": true,
       "raw_author_name": "Richard A. Champion",
       "raw_affiliation_strings": [],
       "affiliations": []
     }
   ],
   "best_oa_location": {
     "is_oa": true,
     "landing_page_url": "https://doi.org/10.3133/ofr20071398",
     "pdf_url": "https://pubs.usgs.gov/of/2007/1398/of2007-1398.pdf",
     "source": {
       "id": "https://openalex.org/S4210194219",
       "display_name": "Antarctica A Keystone in a Changing World",
       "issn_l": "0196-1497",
       "issn": [
         "0196-1497",
         "2331-1258",
         "2332-4899"
       ],
       "is_oa": true,
       "is_in_doaj": false,
       "is_core": true,
       "host_organization": "https://openalex.org/P4310316088",
       "host_organization_name": "United States Department of the Interior",
       "host_organization_lineage": [
         "https://openalex.org/P4310316088"
       ],
       "host_organization_lineage_names": [
         "United States Department of the Interior"
       ],
       "type": "journal"
     },
     "license": null,
     "license_id": null,
     "version": "publishedVersion",
     "is_accepted": true,
     "is_published": true
   },
   "biblio": {
     "volume": null,
     "issue": null,
     "first_page": null,
     "last_page": null
   },
   "citation_normalized_percentile": null,
   "cited_by_api_url": "https://api.openalex.org/works?filter=cites:W1541939501",
   "cited_by_count": 0,
   "cited_by_percentile_year": {
     "min": 0,
     "max": 65
   },
   "concepts": [
     {
       "id": "https://openalex.org/c140779682",
       "wikidata": "https://www.wikidata.org/wiki/Q210868",
       "display_name": "Sampling (signal processing)",
       "level": 3,
       "score": 0.7065876,
       "qid": null
     },
     {
       "id": "https://openalex.org/c41008148",
       "wikidata": "https://www.wikidata.org/wiki/Q21198",
       "display_name": "Computer science",
       "level": 0,
       "score": 0.63706875,
       "qid": "Q158969"
     },
     {
       "id": "https://openalex.org/c165838908",
       "wikidata": "https://www.wikidata.org/wiki/Q736777",
       "display_name": "Calibration",
       "level": 2,
       "score": 0.5806644,
       "qid": null
     },
     {
       "id": "https://openalex.org/c132480984",
       "wikidata": "https://www.wikidata.org/wiki/Q2034239",
       "display_name": "Goodness of fit",
       "level": 2,
       "score": 0.5141909,
       "qid": null
     },
     {
       "id": "https://openalex.org/c50644808",
       "wikidata": "https://www.wikidata.org/wiki/Q192776",
       "display_name": "Artificial neural network",
       "level": 2,
       "score": 0.47590336,
       "qid": null
     },
     {
       "id": "https://openalex.org/c49937458",
       "wikidata": "https://www.wikidata.org/wiki/Q2599292",
       "display_name": "Probabilistic logic",
       "level": 2,
       "score": 0.46213454,
       "qid": null
     },
     {
       "id": "https://openalex.org/c2908647359",
       "wikidata": "https://www.wikidata.org/wiki/Q2625603",
       "display_name": "Population",
       "level": 2,
       "score": 0.44717312,
       "qid": null
     },
     {
       "id": "https://openalex.org/c98045186",
       "wikidata": "https://www.wikidata.org/wiki/Q205663",
       "display_name": "Process (computing)",
       "level": 2,
       "score": 0.44580212,
       "qid": null
     },
     {
       "id": "https://openalex.org/c28719098",
       "wikidata": "https://www.wikidata.org/wiki/Q44946",
       "display_name": "Point (geometry)",
       "level": 2,
       "score": 0.43530294,
       "qid": null
     },
     {
       "id": "https://openalex.org/c124101348",
       "wikidata": "https://www.wikidata.org/wiki/Q172491",
       "display_name": "Data mining",
       "level": 1,
       "score": 0.43499374,
       "qid": "Q226221"
     },
     {
       "id": "https://openalex.org/c119857082",
       "wikidata": "https://www.wikidata.org/wiki/Q2539",
       "display_name": "Machine learning",
       "level": 1,
       "score": 0.3959587,
       "qid": "Q169132"
     },
     {
       "id": "https://openalex.org/c154945302",
       "wikidata": "https://www.wikidata.org/wiki/Q11660",
       "display_name": "Artificial intelligence",
       "level": 1,
       "score": 0.38819668,
       "qid": "Q166116"
     },
     {
       "id": "https://openalex.org/c126255220",
       "wikidata": "https://www.wikidata.org/wiki/Q141495",
       "display_name": "Mathematical optimization",
       "level": 1,
       "score": 0.3345007,
       "qid": "Q226264"
     },
     {
       "id": "https://openalex.org/c105795698",
       "wikidata": "https://www.wikidata.org/wiki/Q12483",
       "display_name": "Statistics",
       "level": 1,
       "score": 0.32348424,
       "qid": "Q161190"
     },
     {
       "id": "https://openalex.org/c33923547",
       "wikidata": "https://www.wikidata.org/wiki/Q395",
       "display_name": "Mathematics",
       "level": 0,
       "score": 0.13900715,
       "qid": "Q161189"
     },
     {
       "id": "https://openalex.org/c111919701",
       "wikidata": "https://www.wikidata.org/wiki/Q9135",
       "display_name": "Operating system",
       "level": 1,
       "score": 0.0,
       "qid": "Q226285"
     },
     {
       "id": "https://openalex.org/c149923435",
       "wikidata": "https://www.wikidata.org/wiki/Q37732",
       "display_name": "Demography",
       "level": 1,
       "score": 0.0,
       "qid": "Q166262"
     },
     {
       "id": "https://openalex.org/c2524010",
       "wikidata": "https://www.wikidata.org/wiki/Q8087",
       "display_name": "Geometry",
       "level": 1,
       "score": 0.0,
       "qid": "Q226246"
     },
     {
       "id": "https://openalex.org/c106131492",
       "wikidata": "https://www.wikidata.org/wiki/Q3072260",
       "display_name": "Filter (signal processing)",
       "level": 2,
       "score": 0.0,
       "qid": null
     },
     {
       "id": "https://openalex.org/c144024400",
       "wikidata": "https://www.wikidata.org/wiki/Q21201",
       "display_name": "Sociology",
       "level": 0,
       "score": 0.0,
       "qid": "Q226182"
     },
     {
       "id": "https://openalex.org/c31972630",
       "wikidata": "https://www.wikidata.org/wiki/Q844240",
       "display_name": "Computer vision",
       "level": 1,
       "score": 0.0,
       "qid": "Q166180"
     }
   ],
   "corresponding_author_ids": [
     "https://openalex.org/A5088522093"
   ],
   "corresponding_institution_ids": [],
   "countries_distinct_count": 0,
   "counts_by_year": [],
   "created_date": "2016-06-24",
   "datasets": [],
   "display_name": "Cost-Benefit Analysis of Computer Resources for Machine Learning",
   "doi": "https://doi.org/10.3133/ofr20071398",
   "fwci": 0.0,
   "grants": [],
   "has_fulltext": false,
   "id": "https://openalex.org/W1541939501",
   "ids": {
     "openalex": "https://openalex.org/W1541939501",
     "doi": "https://doi.org/10.3133/ofr20071398",
     "mag": "1541939501"
   },
   "indexed_in": [
     "crossref"
   ],
   "institutions_distinct_count": 0,
   "is_paratext": false,
   "is_retracted": false,
   "keywords": [
     {
       "id": "https://openalex.org/keywords/robust-learning",
       "display_name": "Robust Learning",
       "score": 0.578965
     },
     {
       "id": "https://openalex.org/keywords/machine-learning",
       "display_name": "Machine Learning",
       "score": 0.537226
     },
     {
       "id": "https://openalex.org/keywords/meta-learning",
       "display_name": "Meta-Learning",
       "score": 0.533675
     },
     {
       "id": "https://openalex.org/keywords/pattern-classification",
       "display_name": "Pattern Classification",
       "score": 0.529402
     },
     {
       "id": "https://openalex.org/keywords/backpropagation-learning",
       "display_name": "Backpropagation Learning",
       "score": 0.529376
     },
     {
       "id": "https://openalex.org/keywords/goodness-of-fit",
       "display_name": "Goodness of fit",
       "score": 0.5141909
     }
   ],
   "language": "en",
   "locations": [
     {
       "is_oa": true,
       "landing_page_url": "https://doi.org/10.3133/ofr20071398",
       "pdf_url": "https://pubs.usgs.gov/of/2007/1398/of2007-1398.pdf",
       "source": {
         "id": "https://openalex.org/S4210194219",
         "display_name": "Antarctica A Keystone in a Changing World",
         "issn_l": "0196-1497",
         "issn": [
           "0196-1497",
           "2331-1258",
           "2332-4899"
         ],
         "is_oa": true,
         "is_in_doaj": false,
         "is_core": true,
         "host_organization": "https://openalex.org/P4310316088",
         "host_organization_name": "United States Department of the Interior",
         "host_organization_lineage": [
           "https://openalex.org/P4310316088"
         ],
         "host_organization_lineage_names": [
           "United States Department of the Interior"
         ],
         "type": "journal"
       },
       "license": null,
       "license_id": null,
       "version": "publishedVersion",
       "is_accepted": true,
       "is_published": true
     }
   ],
   "locations_count": 1,
   "mesh": [],
   "ngrams_url": "https://api.openalex.org/works/W1541939501/ngrams",
   "open_access": {
     "is_oa": true,
     "oa_status": "bronze",
     "oa_url": "https://pubs.usgs.gov/of/2007/1398/of2007-1398.pdf",
     "any_repository_has_fulltext": false
   },
   "primary_location": {
     "is_oa": true,
     "landing_page_url": "https://doi.org/10.3133/ofr20071398",
     "pdf_url": "https://pubs.usgs.gov/of/2007/1398/of2007-1398.pdf",
     "source": {
       "id": "https://openalex.org/S4210194219",
       "display_name": "Antarctica A Keystone in a Changing World",
       "issn_l": "0196-1497",
       "issn": [
         "0196-1497",
         "2331-1258",
         "2332-4899"
       ],
       "is_oa": true,
       "is_in_doaj": false,
       "is_core": true,
       "host_organization": "https://openalex.org/P4310316088",
       "host_organization_name": "United States Department of the Interior",
       "host_organization_lineage": [
         "https://openalex.org/P4310316088"
       ],
       "host_organization_lineage_names": [
         "United States Department of the Interior"
       ],
       "type": "journal"
     },
     "license": null,
     "license_id": null,
     "version": "publishedVersion",
     "is_accepted": true,
     "is_published": true
   },
   "primary_topic": {
     "id": "https://openalex.org/T12814",
     "display_name": "Gaussian Processes in Machine Learning",
     "score": 0.9975,
     "subfield": {
       "id": "https://openalex.org/subfields/1702",
       "display_name": "Artificial Intelligence"
     },
     "field": {
       "id": "https://openalex.org/fields/17",
       "display_name": "Computer Science"
     },
     "domain": {
       "id": "https://openalex.org/domains/3",
       "display_name": "Physical Sciences"
     }
   },
   "publication_date": "2007-01-01",
   "publication_year": 2007,
   "referenced_works": [
     "https://openalex.org/W1486587513",
     "https://openalex.org/W1514027835",
     "https://openalex.org/W1533618852",
     "https://openalex.org/W1663973292",
     "https://openalex.org/W1982647060",
     "https://openalex.org/W2009086942",
     "https://openalex.org/W2047278710",
     "https://openalex.org/W2085344466",
     "https://openalex.org/W2117897510",
     "https://openalex.org/W2132536544",
     "https://openalex.org/W2171033594",
     "https://openalex.org/W2184111892",
     "https://openalex.org/W2535756153",
     "https://openalex.org/W292065152",
     "https://openalex.org/W3189823449",
     "https://openalex.org/W4232383088",
     "https://openalex.org/W4233034972",
     "https://openalex.org/W4244777963",
     "https://openalex.org/W4285719527",
     "https://openalex.org/W4301264738"
   ],
   "referenced_works_count": 20,
   "related_works": [
     "https://openalex.org/W4226213673",
     "https://openalex.org/W4206658415",
     "https://openalex.org/W3167233239",
     "https://openalex.org/W2995459153",
     "https://openalex.org/W2621433169",
     "https://openalex.org/W2493307909",
     "https://openalex.org/W2372709328",
     "https://openalex.org/W2097522327",
     "https://openalex.org/W2050686036",
     "https://openalex.org/W1541538682"
   ],
   "sustainable_development_goals": [],
   "title": "Cost-Benefit Analysis of Computer Resources for Machine Learning",
   "topics": [
     {
       "id": "https://openalex.org/T12814",
       "display_name": "Gaussian Processes in Machine Learning",
       "score": 0.9975,
       "subfield": {
         "id": "https://openalex.org/subfields/1702",
         "display_name": "Artificial Intelligence"
       },
       "field": {
         "id": "https://openalex.org/fields/17",
         "display_name": "Computer Science"
       },
       "domain": {
         "id": "https://openalex.org/domains/3",
         "display_name": "Physical Sciences"
       }
     },
     {
       "id": "https://openalex.org/T12535",
       "display_name": "Learning with Noisy Labels in Machine Learning",
       "score": 0.9851,
       "subfield": {
         "id": "https://openalex.org/subfields/1702",
         "display_name": "Artificial Intelligence"
       },
       "field": {
         "id": "https://openalex.org/fields/17",
         "display_name": "Computer Science"
       },
       "domain": {
         "id": "https://openalex.org/domains/3",
         "display_name": "Physical Sciences"
       }
     },
     {
       "id": "https://openalex.org/T10320",
       "display_name": "Neural Network Fundamentals and Applications",
       "score": 0.9825,
       "subfield": {
         "id": "https://openalex.org/subfields/1702",
         "display_name": "Artificial Intelligence"
       },
       "field": {
         "id": "https://openalex.org/fields/17",
         "display_name": "Computer Science"
       },
       "domain": {
         "id": "https://openalex.org/domains/3",
         "display_name": "Physical Sciences"
       }
     }
   ],
   "type": "article",
   "type_crossref": "journal-article",
   "updated_date": "2024-08-10T09:22:11.163528",
   "versions": [],
   "qid": "Q66357"
 }

}