72 return( Value * Value );
92 return( floor(0.5 + Value) );
95 double d = pow(10., Decimals);
98 if( fabs(v - floor(v)) > 0. )
100 return( floor(0.5 + v) / d );
109 if( Decimals <= 0 || Value == 0. )
111 return( (
int)(0.5 + Value) );
114 Decimals = (int)(-(ceil(log10(fabs(Value))) - Decimals));
118 double d = pow(10., Decimals);
121 ? -((
int)(0.5 - Value * d)) / d
122 : ((
int)(0.5 + Value * d)) / d
127 double d = pow(10., -Decimals);
130 ? -((
int)(0.5 - Value / d)) * d
131 : ((
int)(0.5 + Value / d)) * d
146 Number = abs(Number);
148 return( Number < 10 ? 1 : 1 + (
int)log10((
double)Number) );
163 if( Width > 0 && Precision >= 0 )
return(
CSG_String::Format(
"%*.*e", Width, Precision, Number) );
171 if( Width > 0 && Precision >= 0 )
return(
CSG_String::Format(
"%*.*f", Width, Precision, Number) );
189 if( *((
int *)a) < *((
int *)b) )
192 if( *((
int *)a) > *((
int *)b) )
201 if( *((
double *)a) < *((
double *)b) )
204 if( *((
double *)a) > *((
double *)b) )
213 return( strcmp((
const char *)a, (
const char *)b) );
226 if( Deg < 0. ) { Min = -fabs(Min); Sec = -fabs(Sec); }
228 return( Deg + Min / 60. + Sec / 3600. );
234 Sec = fmod(Value < 0. ? -Value : Value, 360.);
236 Deg = (int)Sec; Sec = 60. * (Sec - Deg);
237 Min = (int)Sec; Sec = 60. * (Sec - Min);
275 return( 1. * rand() / (
double)RAND_MAX );
283 return( min + (max - min) * rand() / (
double)RAND_MAX );
306 w = x1 * x1 + x2 * x2;
310 w = sqrt((-2. * log(w)) / w);
312 return( mean + stddev * x1 * w );
340 Create(Mean, StdDev, Count);
345 Create(Values, bHoldValues);
430 double Scale = nValues / (double)
m_nValues;
544 m_Sum += Weight * Value;
545 m_Sum2 += Weight * Value*Value;
632 if( Quantile <= 0. ||
m_Values.Get_Size() == 1 )
643 double r = Quantile * (
m_Values.Get_Size() - 1);
711 if(
m_Values.Get_Size() == 0 ) {
return( -1 ); }
716 for(
size_t i=1; i<(size_t)
m_Values.Get_Size(); i++)
725 return( (
sLong)Index );
735 if(
m_Values.Get_Size() == 0 ) {
return( -1 ); }
740 for(
size_t i=1; i<(size_t)
m_Values.Get_Size(); i++)
749 return( (
sLong)Index );
759 if(
m_Values.Get_Size() == 0 ) {
return( -1 ); }
781 if(
m_Values.Get_Size() == 0 ) {
return( -1 ); }
878 if( Value == m_Value[i] )
892 m_Value.Add_Row(Value);
905 if( Value == m_Value[i] )
933 if( Value.
Cmp(m_Value[i]) == 0 )
960 if( Value.
Cmp(m_Value[i]) == 0 )
995 m_pTable->Add_Field(
"VALUE", Type);
1002 m_pTable->Del_Records();
1008 return( m_pTable->Get_Field_Type(0) );
1021 return( pRecord ? (
int)pRecord->
Get_Index() : -1);
1029 return( pRecord ? (
int)pRecord->
Get_Index() : -1);
1037 return( pRecord ? (
int)pRecord->
Get_Index() : -1);
1052 (pRecord = m_pTable->Add_Record())->Set_Value(0, Value);
1054 if( m_pTable->Get_Count() > 16 || m_pTable->is_Indexed() )
1062 return( (
int)(m_pTable->Get_Count() - 1) );
1072 (pRecord = m_pTable->Add_Record())->Set_Value(0, Value);
1074 if( m_pTable->Get_Count() > 16 || m_pTable->is_Indexed() )
1082 return( (
int)(m_pTable->Get_Count() - 1) );
1092 (pRecord = m_pTable->Add_Record())->Set_Value(0, Value);
1094 if( m_pTable->Get_Count() > 16 || m_pTable->is_Indexed() )
1102 return( (
int)(m_pTable->Get_Count() - 1) );
1113 for(
sLong i=0; i<m_pTable->Get_Count(); i++)
1133 return( (
int)m_pTable->Get_Count() );
1142 return( pRecord ? pRecord->
asInt(1) : 0 );
1150 return( pRecord ? pRecord->
asInt(0) : 0 );
1158 return( pRecord ? pRecord->
asDouble(0) : 0 );
1177 if( m_pTable->Get_Count() > 0 )
1179 int Index = 0, Count = m_pTable->Get_Record_byIndex(0)->asInt(1);
1181 for(
int i=1; i<m_pTable->Get_Count(); i++)
1183 if( Count < m_pTable->Get_Record_byIndex(i)->
asInt(1) )
1185 Index = i; Count = m_pTable->Get_Record_byIndex(i)->asInt(1);
1198 if( m_pTable->Get_Count() > 0 )
1200 int Index = 0, Count = m_pTable->Get_Record_byIndex(0)->asInt(1);
1202 for(
int i=1; i<m_pTable->Get_Count(); i++)
1204 if( Count > m_pTable->Get_Record_byIndex(i)->asInt(1) )
1206 Index = i; Count = m_pTable->Get_Record_byIndex(i)->asInt(1);
1286 m_Statistics.Create();
1302void CSG_Histogram::_On_Construction(
void)
1306 m_Cumulative = NULL;
1313bool CSG_Histogram::_Create(
size_t nClasses,
double Minimum,
double Maximum)
1319 m_Elements = (
size_t *)
SG_Calloc(nClasses,
sizeof(
size_t));
1320 m_Cumulative = (
size_t *)
SG_Calloc(nClasses,
sizeof(
size_t));
1322 if( m_Elements && m_Cumulative )
1324 m_nClasses = nClasses;
1341 m_Statistics += Value;
1343 if( m_nClasses > 0 && m_Minimum <= Value && Value <= m_Maximum )
1345 size_t Class = (size_t)((Value - m_Minimum) / m_ClassWidth);
1347 if( Class >= m_nClasses )
1349 Class = m_nClasses - 1;
1352 m_Elements[Class]++;
1359 if( m_nClasses > 0 && Scale > 0. )
1363 for(
size_t i=0; i<m_nClasses; i++)
1365 m_Elements[i] = (size_t)(Scale * m_Elements[i]);
1377 if( m_nClasses > 0 )
1379 m_Statistics.Get_Mean();
1381 m_nMaximum = m_Cumulative[0] = m_Elements[0];
1383 for(
size_t i=1; i<m_nClasses; i++)
1385 m_Cumulative[i] = m_Cumulative[i - 1] + m_Elements[i];
1387 if( m_nMaximum < m_Elements[i] )
1389 m_nMaximum = m_Elements[i];
1400bool CSG_Histogram::_Update(
sLong nElements)
1402 if( nElements > 0 && m_Statistics.
Get_Count() > 0 )
1404 double Scale = (double)nElements / (
double)m_Statistics.
Get_Count();
1408 for(
size_t i=1; i<m_nClasses; i++)
1410 m_Elements[i] = (size_t)(0.5 + Scale * m_Elements[i]);
1420 || m_nClasses != Histogram.m_nClasses
1421 || m_Minimum != Histogram.m_Minimum
1422 || m_Maximum != Histogram.m_Maximum )
1427 m_Statistics += Histogram.m_Statistics;
1429 for(
size_t i=0; i<m_nClasses; i++ )
1431 m_Elements[i] += Histogram.m_Elements[i];
1443 if( m_nClasses < 2 ) {
return( 0. ); }
1445 if( Quantile <= 0. ) {
return( m_Minimum ); }
1446 if( Quantile >= 1. ) {
return( m_Maximum ); }
1450 for(
size_t i=0, n0=0; i<m_nClasses; n0=m_Cumulative[i++])
1452 if( n < m_Cumulative[i] )
1454 if( m_Cumulative[i] >= n0 )
1459 double d = (n - n0) / (
double)(m_Cumulative[i] - n0);
1461 return(
Get_Break(i) + d * m_ClassWidth );
1463 else if( n == m_Cumulative[i] )
1469 return( m_Maximum );
1487 if( m_nClasses < 2 ) {
return( 0. ); }
1489 if( Value <= m_Minimum ) {
return( 0. ); }
1490 if( Value >= m_Maximum ) {
return( 1. ); }
1492 size_t Class = (size_t)(m_nClasses * (Value - m_Minimum) / (m_Maximum - m_Minimum));
1494 if( Class >= m_nClasses )
1503 return( dq * (Value - m_Minimum) / m_ClassWidth );
1509 return( q0 + dq * (Value -
Get_Break(Class)) / m_ClassWidth );
1529 if( !_Create(Histogram.m_nClasses, Histogram.m_Minimum, Histogram.m_Maximum) )
1534 m_Statistics = Histogram.m_Statistics;
1535 m_ClassWidth = Histogram.m_ClassWidth;
1536 m_nMaximum = Histogram.m_nMaximum ;
1538 for(
size_t i=0; i<m_nClasses; i++)
1540 m_Cumulative[i] = Histogram.m_Cumulative[i];
1541 m_Elements [i] = Histogram.m_Elements [i];
1570 if( maxSamples > 0 && maxSamples < (
size_t)Values.
Get_N() )
1572 double d = (double)Values.
Get_N() / (double)maxSamples;
1574 for(
double i=0; i<(double)Values.
Get_N(); i+=d)
1579 d = (double)m_Statistics.Get_Count() / (double)maxSamples;
1581 return( _Update(d < 1. ? (
int)(d * (
double)Values.
Get_N()) : Values.
Get_N()) );
1585 for(
int i=0; i<Values.
Get_N(); i++)
1596 if( !pTable || Field < 0 || Field >= pTable->
Get_Field_Count() || !_Create(nClasses,
1604 if( maxSamples > 0 && maxSamples < (
size_t)pTable->
Get_Count() )
1606 double Value, Dividend, d = (double)pTable->
Get_Count() / (double)maxSamples;
1608 for(
double i=0; i<(double)pTable->
Get_Count(); i+=d)
1616 else if( pTable->
Get_Value((
sLong)i, Normalize, Dividend) && Dividend != 0. )
1623 d = (double)m_Statistics.Get_Count() / (double)maxSamples;
1631 double Value, Dividend;
1633 if( pTable->
Get_Value(i, Field, Value) )
1639 else if( pTable->
Get_Value((
sLong)i, Normalize, Dividend) && Dividend != 0. )
1652 if( !pGrid || !_Create(nClasses,
1660 if( maxSamples > 0 && (
sLong)maxSamples < pGrid->Get_NCells() )
1662 double d = (double)pGrid->
Get_NCells() / (double)maxSamples;
1664 for(
double i=0; i<(double)pGrid->
Get_NCells(); i+=d)
1672 d = (double)m_Statistics.Get_Count() / (double)maxSamples;
1692 if( !pGrids || !_Create(nClasses,
1700 if( maxSamples > 0 && (
sLong)maxSamples < pGrids->Get_NCells() )
1702 double d = (double)pGrids->
Get_NCells() / (double)maxSamples;
1704 for(
double i=0; i<(double)pGrids->
Get_NCells(); i+=d)
1712 d = (double)m_Statistics.Get_Count() / (double)maxSamples;
1760 Create(pTable, Field, nClasses, Histogram);
1766 Create(pGrid, nClasses, Histogram);
1772 Create(pGrids, nClasses, Histogram);
1778 Create(Values, nClasses, Histogram);
1789 bool bResult =
false;
1793 bResult = m_Histogram.Create(Histogram, pTable, Field) && _Histogram(nClasses);
1795 else if( Field >= 0 && Field < pTable->Get_Field_Count() )
1801 if( pTable->
Get_Value(i, Field, Value) )
1803 m_Values.Add_Row(Value);
1807 bResult = m_Values.Sort() && _Calculate(nClasses);
1818 bool bResult =
false;
1822 bResult = m_Histogram.Create(Histogram, pGrid) && _Histogram(nClasses);
1830 m_Values.Add_Row(pGrid->
asDouble(i));
1834 bResult = m_Values.Sort() && _Calculate(nClasses);
1845 bool bResult =
false;
1849 bResult = m_Histogram.Create(Histogram, pGrids) && _Histogram(nClasses);
1857 m_Values.Add_Row(pGrids->
asDouble(i));
1861 bResult = m_Values.Sort() && _Calculate(nClasses);
1872 bool bResult =
false;
1876 bResult = m_Histogram.Create(Histogram, Values) && _Histogram(nClasses);
1880 bResult = m_Values.Create(Values) && m_Values.Sort() && _Calculate(nClasses);
1894bool CSG_Natural_Breaks::_Histogram(
int nClasses)
1896 if( _Calculate(nClasses) )
1904 m_Breaks[i] = m_Histogram.
Get_Value(m_Breaks[i] * d);
1907 m_Breaks[nClasses] = m_Histogram.Get_Break((
int)m_Histogram.Get_Class_Count());
1909 m_Histogram.Destroy();
1914 m_Histogram.Destroy();
1920inline double CSG_Natural_Breaks::_Get_Value(
int i)
1922 if( m_Histogram.Get_Class_Count() > 0 )
1924 return( (
double)m_Histogram.Get_Cumulative(i) );
1927 return( m_Values[i] );
1931bool CSG_Natural_Breaks::_Calculate(
int nClasses)
1933 if( m_Histogram.Get_Class_Count() == 0 && m_Values.Get_Size() == 0 )
1938 int nValues = m_Histogram.Get_Class_Count() > 0 ? (int)m_Histogram.Get_Class_Count() : m_Values.Get_N();
1940 CSG_Matrix mv(nClasses, nValues); mv.Assign(FLT_MAX);
1942 int **mc = (
int **)
SG_Malloc(nValues *
sizeof(
int *));
1944 mc[0] = (
int *)
SG_Calloc((
size_t)nClasses * nValues,
sizeof(
int));
1946 for(
int i=0; i<nValues; i++)
1948 mc[i] = mc[0] + i * (size_t)nClasses;
1952 for(
int i=1; i<nValues; i++)
1954 double v = 0., s1 = 0., s2 = 0., w = 0.;
1956 for(
int m=0, n=i+1; m<=i; m++, n--)
1962 v = s2 - (s1 * s1) / w;
1966 for(
int j=1; j<nClasses; j++)
1968 if( mv[i][j] >= (v + mv[n - 1][j - 1]) )
1971 mv[i][j] = v + mv[n - 1][j - 1];
1982 CSG_Array_Int Class(nClasses);
1984 for(
int i=0; i<nClasses; i++)
1989 int j = Class[(size_t)nClasses - 1] = nValues - 1;
1991 for(
int i=nClasses-1; i>0; i--)
1993 Class[(size_t)i - 1] = j = mc[j - 1][i];
1997 m_Breaks.Create((
size_t)nClasses + 1);
1999 m_Breaks[0] = _Get_Value(0);
2001 for(
int i=1; i<nClasses; i++)
2003 m_Breaks[i] = _Get_Value(Class[i - 1]);
2006 m_Breaks[nClasses] = _Get_Value(nValues - 1);
2036 m_Centroid.Destroy();
2037 m_Variance.Destroy();
2038 m_nMembers.Destroy();
2039 m_Clusters.Destroy();
2040 m_Features.Destroy();
2054 m_nFeatures = nFeatures;
2067 return( m_nFeatures > 0 && m_Features.Inc_Array() );
2073 if( iElement >= 0 && iElement <
Get_nElements() && iFeature >= 0 && iFeature < m_nFeatures )
2075 ((
double *)m_Features.Get_Entry(iElement))[iFeature] = Value;
2102 m_nMembers.Create(nClusters);
2103 m_Variance.Create(nClusters);
2104 m_Centroid.Create(m_nFeatures, nClusters);
2111 switch( Initialization )
2116 m_Clusters[iElement] = nClusters - 1;
2122 m_Clusters[iElement] = iElement % nClusters;
2127 if( 0 > m_Clusters[iElement] || m_Clusters[iElement] >= nClusters )
2129 m_Clusters[iElement] = iElement % nClusters;
2142 default: bResult = _Minimum_Distance(
true , nMaxIterations);
break;
2143 case 1: bResult = _Hill_Climbing (
true , nMaxIterations);
break;
2144 case 2: bResult = _Minimum_Distance(
true , nMaxIterations)
2145 && _Hill_Climbing (
false, nMaxIterations);
break;
2151 for(
int iCluster=0; iCluster<nClusters; iCluster++)
2153 m_Variance[iCluster] = m_nMembers[iCluster] <= 0 ? 0. : m_Variance[iCluster] / m_nMembers[iCluster];
2161bool CSG_Cluster_Analysis::_Minimum_Distance(
bool bInitialize,
int nMaxIterations)
2163 int iElement, iCluster, nClusters = m_Variance.
Get_N();
2165 double SP_Last = -1.;
2177 m_nMembers[iCluster = m_Clusters[iElement]]++;
2179 double *Feature = (
double *)m_Features.
Get_Entry(iElement);
2181 for(
int iFeature=0; iFeature<m_nFeatures; iFeature++)
2183 m_Centroid[iCluster][iFeature] += Feature[iFeature];
2188 for(iCluster=0; iCluster<nClusters; iCluster++)
2190 double d = m_nMembers[iCluster] > 0 ? 1. / m_nMembers[iCluster] : 0.;
2192 for(
int iFeature=0; iFeature<m_nFeatures; iFeature++)
2194 m_Centroid[iCluster][iFeature] *= d;
2199 int nShifts = 0; m_SP = 0.;
2203 double *Feature = (
double *)m_Features.Get_Entry(iElement);
2205 double minVariance = -1.;
2206 int minCluster = -1;
2208 for(iCluster=0; iCluster<nClusters; iCluster++)
2210 double Variance = 0.;
2212 for(
int iFeature=0; iFeature<m_nFeatures; iFeature++)
2214 Variance +=
SG_Get_Square(m_Centroid[iCluster][iFeature] - Feature[iFeature]);
2217 if( minVariance < 0. || Variance < minVariance )
2219 minVariance = Variance;
2220 minCluster = iCluster;
2224 if( m_Clusters[iElement] != minCluster )
2226 m_Clusters[iElement] = minCluster;
2231 m_SP += minVariance;
2232 m_Variance[minCluster] += minVariance;
2239 _TL(
"pass" ), m_Iteration,
2240 _TL(
"change"), m_Iteration < 2 ? m_SP : SP_Last - m_SP
2245 if( nShifts == 0 || (nMaxIterations > 0 && nMaxIterations <= m_Iteration) )
2255bool CSG_Cluster_Analysis::_Hill_Climbing(
bool bInitialize,
int nMaxIterations)
2257 int iElement, iCluster, nClusters = m_Variance.Get_N();
2266 m_nMembers[iCluster = m_Clusters[iElement]]++;
2268 double *Feature = (
double *)m_Features.Get_Entry(iElement);
2270 for(
int iFeature=0; iFeature<m_nFeatures; iFeature++)
2272 double d = Feature[iFeature];
2274 m_Centroid[iCluster][iFeature] += d;
2275 m_Variance[iCluster] += d*d;
2280 for(iCluster=0; iCluster<nClusters; iCluster++)
2282 double v = 0., d = m_nMembers[iCluster] <= 0 ? 0. : 1. / (double)m_nMembers[iCluster];
2284 for(
int iFeature=0; iFeature<m_nFeatures; iFeature++)
2286 m_Centroid[iCluster][iFeature] *= d;
2290 m_Variance[iCluster] -= v * m_nMembers[iCluster];
2294 double SP_Last = -1.;
int noShift = 0;
2300 iCluster = m_Clusters[iElement];
2302 if( noShift++ <
Get_nElements() && m_nMembers[iCluster] > 1 )
2304 double *Feature = (
double *)m_Features.Get_Entry(iElement);
2306 double Variance = 0.;
2308 for(
int iFeature=0; iFeature<m_nFeatures; iFeature++)
2310 Variance +=
SG_Get_Square(m_Centroid[iCluster][iFeature] - Feature[iFeature]);
2313 double V1 = Variance * m_nMembers[iCluster] / (m_nMembers[iCluster] - 1.);
2316 int kCluster = 0;
double VMin = -1.;
2318 for(
int jCluster=0; jCluster<nClusters; jCluster++)
2320 if( jCluster != iCluster )
2324 for(
int iFeature=0; iFeature<m_nFeatures; iFeature++)
2326 Variance +=
SG_Get_Square(m_Centroid[jCluster][iFeature] - Feature[iFeature]);
2329 double V2 = Variance * m_nMembers[jCluster] / (m_nMembers[jCluster] + 1.);
2331 if( VMin < 0. || V2 < VMin )
2334 kCluster = jCluster;
2340 if( VMin >= 0 && VMin < V1 )
2343 m_Variance[iCluster] -= V1;
2344 m_Variance[kCluster] += VMin;
2345 V1 = 1. / (m_nMembers[iCluster] - 1.);
2346 double V2 = 1. / (m_nMembers[kCluster] + 1.);
2348 for(
int iFeature=0; iFeature<m_nFeatures; iFeature++)
2350 double d = Feature[iFeature];
2352 m_Centroid[iCluster][iFeature] = (m_nMembers[iCluster] * m_Centroid[iCluster][iFeature] - d) * V1;
2353 m_Centroid[kCluster][iFeature] = (m_nMembers[kCluster] * m_Centroid[kCluster][iFeature] + d) * V2;
2356 m_Clusters[iElement] = kCluster;
2358 m_nMembers[iCluster]--;
2359 m_nMembers[kCluster]++;
2365 for(iCluster=0, m_SP=0.; iCluster<nClusters; iCluster++)
2367 m_SP += m_Variance[iCluster];
2373 _TL(
"pass" ), m_Iteration,
2374 _TL(
"change"), m_Iteration <= 1 ? m_SP : SP_Last - m_SP
2379 if( noShift >=
Get_nElements() || (nMaxIterations > 0 && nMaxIterations <= m_Iteration) )
2398 m_nFeatures = 0; m_pClasses = NULL; m_nClasses = 0;
2400 m_Threshold_Distance = 0.;
2401 m_Threshold_Angle = 0.;
2402 m_Threshold_Probability = 0.;
2403 m_Probability_Relative =
false;
2427 m_nFeatures = nFeatures;
2434 if( m_nClasses > 0 )
2436 for(
int i=0; i<m_nClasses; i++)
2438 delete(m_pClasses[i]);
2475 m_bWTA[Method] = bOn;
2495 int nFeatures = m_nFeatures;
Destroy(); m_nFeatures = nFeatures;
2505 if( !Data(
"classes") || !Data(
"features") || !Data[
"features"](
"count") || Data[
"features"][
"count"].Get_Content().asInt() != m_nFeatures || m_nFeatures == 0 )
2510 if( Data[
"features"](
"info") )
2520 if( Classes[i].Cmp_Name(
"class") && Classes[i].Get_Child(
"id") )
2524 CClass *pClass =
new CClass(Classes[i][
"id"].Get_Content());
2538 m_pClasses = (CClass **)
SG_Realloc(m_pClasses, ((
size_t)m_nClasses + 1) *
sizeof(CClass *));
2539 m_pClasses[m_nClasses++] = pClass;
2549 return( m_nClasses > 0 );
2555 if( m_nFeatures < 1 || m_nClasses < 1 || File.
is_Empty() )
2562 Data.
Set_Name (
"supervised_classifier");
2567 Features.
Add_Child(
"count", m_nFeatures);
2569 if( Feature_Info && *Feature_Info )
2571 Features.
Add_Child(
"info", Feature_Info);
2578 for(
int i=0; i<m_nClasses; i++)
2582 CClass *pClass = m_pClasses[i];
2591 return( Data.
Save(File) );
2604 if( m_nFeatures > 0 && m_nClasses > 0 )
2608 for(
int iClass=0; iClass<m_nClasses; iClass++)
2610 CClass *pClass = m_pClasses[iClass];
2612 s +=
"\n____\n" + pClass->m_ID +
"\nFeature\tMean\tMin\tMax\tStdDev";
2614 for(
int i=0; i<m_nFeatures; i++)
2638 if( m_nFeatures < 1 || Mean.
Get_N() != m_nFeatures || Min.
Get_N() != m_nFeatures || Max.
Get_N() != m_nFeatures || Cov.
Get_NCols() != m_nFeatures || Cov.
Get_NRows() != m_nFeatures )
2643 CClass *pClass, **pClasses = (CClass **)
SG_Realloc(m_pClasses, ((
size_t)m_nClasses + 1) *
sizeof(CClass *));
2647 m_pClasses = pClasses;
2649 m_pClasses[m_nClasses++] = pClass =
new CClass(Class_ID);
2651 pClass->m_ID = Class_ID;
2652 pClass->m_Mean = Mean;
2653 pClass->m_Min = Min;
2654 pClass->m_Max = Max;
2655 pClass->m_Cov = Cov;
2675 for(
int i=0; i<m_nClasses; i++)
2677 m_pClasses[i]->m_Samples.Destroy();
2686 if( m_nFeatures > 0 && m_nFeatures == Features.
Get_N() )
2692 CClass **pClasses = (CClass **)
SG_Realloc(m_pClasses, ((
size_t)m_nClasses + 1) *
sizeof(CClass *));
2696 m_pClasses = pClasses;
2698 m_pClasses[iClass = m_nClasses++] =
new CClass(Class_ID);
2704 return( m_pClasses[iClass]->m_Samples.Add_Row(Features) );
2714 if( m_nFeatures < 1 || m_nClasses < 1 )
2719 for(
int iClass=0; iClass<m_nClasses; iClass++)
2721 if( !m_pClasses[iClass]->
Train() )
2727 if( bClear_Samples )
2741bool CSG_Classifier_Supervised::CClass::Train(
void)
2749 m_Mean.
Create(m_Samples.Get_NCols());
2750 m_Min .Create(m_Samples.Get_NCols());
2751 m_Max .Create(m_Samples.Get_NCols());
2753 for(
int iFeature=0; iFeature<m_Samples.Get_NCols(); iFeature++)
2755 CSG_Simple_Statistics s;
2757 for(
int iSample=0; iSample<m_Samples.Get_NRows(); iSample++)
2759 s += m_Samples[iSample][iFeature];
2768 m_Cov.Create(m_Samples.Get_NCols(), m_Samples.Get_NCols());
2770 for(
int iFeature=0; iFeature<m_Samples.Get_NCols(); iFeature++)
2772 for(
int jFeature=iFeature; jFeature<m_Samples.Get_NCols(); jFeature++)
2776 for(
int iSample=0; iSample<m_Samples.Get_NRows(); iSample++)
2778 cov += (m_Samples[iSample][iFeature] - m_Mean[iFeature]) * (m_Samples[iSample][jFeature] - m_Mean[jFeature]);
2781 if( m_Samples.Get_NRows() > 1 )
2783 cov /= m_Samples.Get_NRows() - 1;
2786 m_Cov[iFeature][jFeature] = m_Cov[jFeature][iFeature] = cov;
2790 m_Cov_Inv = m_Cov.Get_Inverse ();
2791 m_Cov_Det = m_Cov.Get_Determinant();
2793 m_Mean_Spectral = CSG_Simple_Statistics(m_Mean).Get_Mean();
2807 if( m_nFeatures > 0 )
2824 Class = -1; Quality = 0.;
2840 return( Class >= 0 );
2899void CSG_Classifier_Supervised::_Get_Binary_Encoding(
const CSG_Vector &Features,
int &Class,
double &Quality)
2903 CClass *pClass = m_pClasses[iClass];
2911 d += (Features(iFeature) < Mean_Spectral) == (pClass->m_Mean[iFeature] < pClass->m_Mean_Spectral) ? 0 : 1;
2915 d += (Features[iFeature ] < Features[iFeature + 1]) == (pClass->m_Mean[iFeature ] < pClass->m_Mean[iFeature + 1]) ? 0 : 1;
2919 d += (Features[iFeature - 1] < Features[iFeature ]) == (pClass->m_Mean[iFeature - 1] < pClass->m_Mean[iFeature ]) ? 0 : 1;
2923 d += (Features[iFeature - 1] < Features[iFeature + 1]) == (pClass->m_Mean[iFeature - 1] < pClass->m_Mean[iFeature + 1]) ? 0 : 1;
2927 if( Class < 0 || Quality > d )
2929 Class = iClass; Quality = d;
2935void CSG_Classifier_Supervised::_Get_Parallel_Epiped(
const CSG_Vector &Features,
int &Class,
double &Quality)
2939 CClass *pClass = m_pClasses[iClass];
2941 bool bMember =
true;
2945 bMember = pClass->m_Min[iFeature] <= Features[iFeature] && Features[iFeature] <= pClass->m_Max[iFeature];
2950 Class = iClass; Quality++;
2956void CSG_Classifier_Supervised::_Get_Minimum_Distance(
const CSG_Vector &Features,
int &Class,
double &Quality)
2960 CClass *pClass = m_pClasses[iClass];
2962 double Distance = (Features - pClass->m_Mean).Get_Length();
2964 if( Class < 0 || Quality > Distance )
2966 Class = iClass; Quality = Distance;
2970 if( m_Threshold_Distance > 0. && Quality > m_Threshold_Distance )
2977void CSG_Classifier_Supervised::_Get_Mahalanobis_Distance(
const CSG_Vector &Features,
int &Class,
double &Quality)
2981 CClass *pClass = m_pClasses[iClass];
2983 CSG_Vector D = Features - pClass->m_Mean;
2985 double Distance = D * (pClass->m_Cov_Inv * D);
2987 if( Class < 0 || Quality > Distance )
2989 Class = iClass; Quality = Distance;
2993 if( m_Threshold_Distance > 0. && Quality > m_Threshold_Distance )
3000void CSG_Classifier_Supervised::_Get_Maximum_Likelihood(
const CSG_Vector &Features,
int &Class,
double &Quality)
3006 CClass *pClass = m_pClasses[iClass];
3008 CSG_Vector D = Features - pClass->m_Mean;
3010 double Distance = D * (pClass->m_Cov_Inv * D);
3012 double Probability = pow(2. *
M_PI, -0.5 * m_nFeatures) * pow(pClass->m_Cov_Det, -0.5) * exp(-0.5 * Distance);
3015 dSum += Probability;
3017 if( Class < 0 || Quality < Probability )
3019 Class = iClass; Quality = Probability;
3025 if( m_Probability_Relative )
3027 Quality = 100. * Quality / dSum;
3030 if( m_Threshold_Probability > 0. && Quality < m_Threshold_Probability )
3038void CSG_Classifier_Supervised::_Get_Spectral_Angle_Mapping(
const CSG_Vector &Features,
int &Class,
double &Quality)
3042 CClass *pClass = m_pClasses[iClass];
3044 double Angle = Features.
Get_Angle(pClass->m_Mean);
3046 if( Class < 0 || Quality > Angle )
3048 Class = iClass; Quality = Angle;
3054 if( m_Threshold_Angle > 0. && Quality > m_Threshold_Angle )
3061void CSG_Classifier_Supervised::_Get_Spectral_Divergence(
const CSG_Vector &Features,
int &Class,
double &Quality)
3066void CSG_Classifier_Supervised::_Get_Winner_Takes_All(
const CSG_Vector &Features,
int &Class,
double &Quality)
3072 int iClass;
double iQuality;
3074 if( m_bWTA[iMethod] &&
Get_Class(Features, iClass, iQuality, iMethod) && ++Votes[iClass] > Quality )
3076 Class = iClass; Quality = Votes[iClass];
3099 if( !T || !df || df < 1. )
3112 if( p <= 0. || p >= 1. || df < 1 )
3118 double t = 0, p0, p1, diff = 1.;
3122 while( fabs(diff) > 0.0001 )
3124 t = Get_T_Inv(p1, df);
3125 diff = Get_T_P(t, df) - p0;
3129 return( bNegative ? -t : t );
3162 const double a1 = 0.0000053830, a2 = 0.0000488906, a3 = 0.0000380036;
3163 const double a4 = 0.0032776263, a5 = 0.0211410061, a6 = 0.0498673470;
3167 double p = (((((a1 * z + a2) * z + a3) * z + a4) * z + a5) * z + a6) * z + 1.;
3169 return( pow(p, -16) );
3175 const double a0 = 2.5066282, a1 = -18.6150006, a2 = 41.3911977, a3 = -25.4410605;
3176 const double b1 = -8.4735109, b2 = 23.0833674, b3 = -21.0622410, b4 = 3.1308291;
3177 const double c0 = -2.7871893, c1 = -2.2979648, c2 = 4.8501413, c3 = 2.3212128;
3178 const double d1 = 3.5438892, d2 = 1.6370678;
3182 double r = sqrt(-log(0.5 - p));
3184 return( (((c3 * r + c2) * r + c1) * r + c0) / ((d2 * r + d1) * r + 1.) );
3190 return( p * (((a3 * r + a2) * r + a1) * r + a0) / ((((b4 * r + b3) * r + b2) * r + b1) * r + 1.) );
3195double CSG_Test_Distribution::Get_T_P(
double T,
int df)
3197 return( df == 1 ? 1. - 2. * atan(fabs(T)) /
M_PI
3198 : df == 2 ? 1. - fabs(T) / sqrt(T*T + 2.)
3199 : df == 3 ? 1. - 2. * (atan(fabs(T) / sqrt(3.)) + fabs(T) * sqrt(3.) / (T*T + 3.)) /
M_PI
3200 : df == 4 ? 1. - fabs(T) * (1. + 2. / (T*T + 4.)) / sqrt(T*T + 4.)
3201 : Get_Norm_P(Get_T_Z(fabs(T), df))
3206double CSG_Test_Distribution::Get_T_Z(
double T,
int df)
3210 double A9, B9, T9, Z8, P7, B7, z;
3217 : A9 * (((1. - T9 * 0.75) * T9 / 3. - 0.5) * T9 + 1.) * T9;
3218 P7 = ((0.4 * Z8 + 3.3) * Z8 + 24.) * Z8 + 85.5;
3219 B7 = 0.8 * pow(Z8, 2.) + 100. + B9;
3220 z = (1. + (-P7 / B7 + Z8 + 3.) / B9) * sqrt(Z8);
3226double CSG_Test_Distribution::Get_T_Inv(
double p,
int df)
3232 return( cos(p *
M_PI / 2.) / sin(p *
M_PI / 2.) );
3237 return( sqrt(2. / (p * (2. - p)) - 2.) );
3240 double a = 1. / (df - 0.5);
3241 double b = 48. / (a*a);
3242 double c = ((20700. * a / b - 98.) * a - 16.) * a + 96.36;
3243 double d = ((94.5 / (b + c) - 3.) / b + 1.) * sqrt(a *
M_PI / 2.) * df;
3245 double y = pow(x, 2. / df);
3249 x = Get_Norm_Z(0.5 * (1. - p));
3254 c = c + 0.3 * (df - 4.5) * (x + 0.6);
3257 c = (((0.05 * d * x - 5) * x - 7.) * x - 2.) * x + b + c;
3258 y = (((((0.4 * y + 6.3) * y + 36.) * y + 94.5) / c - y - 3.) / b + 1.) * x;
3272 y = ((1. / (((df + 6.) / (df * y) - 0.089 * d - 0.822) * (df + 2.) * 3.)
3273 + 0.5 / (df + 4.)) * y - 1.) * (df + 1.) / (df + 2.) + 1. / y;
3276 return( sqrt(df * y) );
3287 double F = ((
sLong)nSamples - (
sLong)nPredictors - 1) * (R2 / nPredictors) / (1. - R2);
3299 if( F >= 0.00001 && dfn > 0 && dfd > 0 )
3301 if( F * dfn >= dfd || F > 1. + 20. / dfn + 10. / sqrt((
double)dfn) )
3303 p = Get_Gamma(F, dfn, dfd);
3307 p = 1. - Get_Gamma(1. / F, dfd, dfn);
3311 if( p <= 0. || p >= 1. )
3313 p = F > 1. ? 0. : F < 1. ? 1. : 0.5;
3322 if( alpha < 0. || alpha > 1. || dfd < 0 || dfn < 0 )
3332 const int ITERMAX = 100;
3333 const double EPSILON = 0.0001;
3336 double lo, hi, mid, p;
3343 for(i=0; i<ITERMAX; i++)
3368 for(i=0; i<ITERMAX; i++)
3389 mid = (hi + lo) / 2.;
3391 for(i=0; i<ITERMAX && (hi-lo)>
EPSILON*mid; i++)
3393 mid = (hi + lo) / 2.;
3398 else if( p > alpha )
3408double CSG_Test_Distribution::Get_Gamma(
double F,
double dfn,
double dfd)
3412 const double EXPMIN = -30.;
3413 const double SMALL = 0.00000000001;
3415 double x, c, er, s, n, t1, t;
3420 x = dfd / (dfd + dfn * F);
3421 c = Get_Log_Gamma(dfn + dfd) - Get_Log_Gamma(dfn) - Get_Log_Gamma(dfd + 1.) + dfd * log(x) + dfn * log(1. - x);
3437 while( t > er || t > t1 )
3441 t *= ((dfn + n) * x / (dfd + n));
3449double CSG_Test_Distribution::Get_Log_Gamma(
double a)
3453 const int ARGMIN = 6;
3455 const double HL2PI = 0.91893853320467275;
3457 int n = (int)floor(ARGMIN - a + 0.0001);
3467 g = (1. - g * (1. / 30. - g * (1. / 105. - g * (1. / 140. - g / 99.)))) / (12. * a);
3468 g = g + ((a - 0.5) * log(a) - a + HL2PI);
3470 for(
int i=0; i<n; i++)
3489 int nVariables = Values.
Get_NX();
3490 int nSamples = Values.
Get_NY();
3497 C.Create(nVariables, nVariables);
3502 for(j=0; j<nVariables; j++)
3504 for(i=0; i<nSamples; i++)
3506 S[j] += Values[i][j];
3511 for(k=0; k<nVariables; k++)
3513 for(j=k; j<nVariables; j++)
3517 for(i=0; i<nSamples; i++)
3519 cov += (Values[i][j] - S[j].
Get_Mean()) * (Values[i][k] - S[k].
Get_Mean());
3526 cov /= (S[j].
Get_StdDev() * S[k].Get_StdDev());
3529 C[j][k] =
C[k][j] = cov;
bool SG_UI_Process_Get_Okay(bool bBlink)
void SG_UI_Process_Set_Text(const CSG_String &Text)
SAGA_API_DLL_EXPORT void * SG_Malloc(size_t size)
SAGA_API_DLL_EXPORT void SG_Free(void *memblock)
SAGA_API_DLL_EXPORT void * SG_Realloc(void *memblock, size_t size)
SAGA_API_DLL_EXPORT void * SG_Calloc(size_t num, size_t size)
#define SG_FREE_SAFE(PTR)
SAGA_API_DLL_EXPORT CSG_String SG_Get_String(double Value, int Precision=-99)
sLong Get_Size(void) const
void * Get_Entry(sLong Index) const
Returns a pointer to the memory address of the requested variable. You have to type cast and derefere...
void Create(TSG_Data_Type Type=SG_DATATYPE_String)
virtual ~CSG_Category_Statistics(void)
int Get_Category(int Value) const
int asInt(int iCategory) const
double asDouble(int iCategory) const
int Get_Count(void) const
CSG_Category_Statistics(TSG_Data_Type Type=SG_DATATYPE_String)
CSG_String asString(int iCategory) const
TSG_Data_Type Get_Category_Type(void) const
void Set_Probability_Relative(bool Value)
virtual ~CSG_Classifier_Supervised(void)
void Set_Threshold_Distance(double Value)
CSG_Classifier_Supervised(void)
double Get_Threshold_Probability(void)
void Create(int nFeatures)
int Get_Class_Count(void)
int Get_Feature_Count(void)
bool Add_Class(const CSG_String &Class_ID, const CSG_Vector &Mean, const CSG_Vector &Min, const CSG_Vector &Max, const CSG_Matrix &Cov)
void Set_Threshold_Probability(double Value)
bool Get_Probability_Relative(void)
bool Train(bool bClr_Samples=false)
const CSG_String & Get_Class_ID(int iClass)
void Set_Threshold_Angle(double Value)
bool Train_Add_Sample(const CSG_String &Class_ID, const CSG_Vector &Features)
double Get_Threshold_Distance(void)
static CSG_String Get_Name_of_Quality(int Method)
int Get_Class(const CSG_String &Class_ID)
void Set_WTA(int Method, bool bOn)
bool Train_Clr_Samples(void)
bool Save(const CSG_String &File, const SG_Char *Feature_Info=NULL)
static CSG_String Get_Name_of_Method(int Method)
bool Load(const CSG_String &File)
double Get_Threshold_Angle(void)
bool Create(int nFeatures)
bool Execute(int Method, int nClusters, int nMaxIterations=0, int Initialization=0)
bool Set_Feature(sLong iElement, int iFeature, double Value)
sLong Get_nElements(void) const
virtual ~CSG_Cluster_Analysis(void)
CSG_Cluster_Analysis(void)
virtual bool is_NoData(int x, int y) const
virtual double asDouble(sLong i, bool bScaled=true) const
sLong Get_NCells(void) const
virtual bool is_NoData(int x, int y, int z) const
sLong Get_NCells(void) const
virtual double asDouble(sLong i, bool bScaled=true) const
CSG_Histogram & operator=(const CSG_Histogram &Histogram)
bool Scale_Element_Count(double Scale)
virtual ~CSG_Histogram(void)
double Get_Center(int i) const
void Add_Value(double Value)
double Get_Value(double i) const
size_t Get_Class_Count(void) const
size_t Get_Cumulative(int i) const
bool Create(const CSG_Histogram &Histogram)
double Get_Quantile(double Quantile) const
double Get_Percentile_Value(double Value) const
double Get_Percentile(double Percentile) const
bool Add_Histogram(const CSG_Histogram &Histogram)
double Get_Break(int i) const
size_t Get_Element_Count(void) const
double Get_Quantile_Value(double Value) const
sLong Get_NRows(void) const
bool from_String(const CSG_String &String)
sLong Get_NCols(void) const
double Get_Determinant(void) const
bool is_Square(void) const
CSG_String to_String(int Width=-1, int Precision=-1, bool bScientific=false, const SG_Char *Separator=NULL) const
CSG_Matrix Get_Inverse(bool bSilent=true, int nSubSquare=0) const
virtual ~CSG_Natural_Breaks(void)
bool Create(class CSG_Table *pTable, int Field, int nClasses, int Histogram=0)
int Get_Count(void) const
static double Get_Gaussian(double mean, double stddev)
static void Initialize(void)
static double Get_Uniform(void)
sLong Get_IndexOfMinimum(void)
void Add(const CSG_Simple_Statistics &Statistics)
double Get_Percentile(double Percentile)
double Get_Value(sLong i) const
CSG_Simple_Statistics(void)
sLong Get_nValues_Above(double Threshold, bool bEquals=false)
sLong Get_nValues_Below(double Threshold, bool bEquals=false)
int is_Evaluated(void) const
double * Get_Values(void) const
double Get_SkewnessPearson(void)
sLong Get_IndexOfMaximum(void)
bool Set_Count(sLong Count)
void _Evaluate(int Level=1)
bool Create(bool bHoldValues=false)
sLong Get_Count(void) const
void Add_Value(double Value, double Weight=1.)
double Get_Quantile(double Quantile)
int Cmp(const CSG_String &String) const
static CSG_String Format(const char *Format,...)
bool is_Empty(void) const
bool Create(const class wxString *pString)
sLong Get_Index(void) const
double asDouble(int Field) const
int asInt(int Field) const
const SG_Char * asString(int Field, int Decimals=-99) const
bool Add_Value(int Field, double Value)
sLong Get_Count(void) const
virtual bool Get_Value(sLong Index, int Field, CSG_String &Value) const
bool Set_Index(CSG_Index &Index, int Field, bool bAscending=true) const
int Get_Field_Count(void) const
CSG_Table_Record * Get_Record_byIndex(sLong Index) const
static double Get_Norm_P(double Z)
static double Get_F_Inverse(double alpha, int dfn, int dfd, TSG_Test_Distribution_Type Type=TESTDIST_TYPE_Right)
static double Get_F_Tail_from_R2(double R2, int nPredictors, int nSamples, TSG_Test_Distribution_Type Type=TESTDIST_TYPE_Right)
static double Get_T_Tail(double T, int df, TSG_Test_Distribution_Type Type=TESTDIST_TYPE_Right)
static double Get_F_Tail(double F, int dfn, int dfd, TSG_Test_Distribution_Type Type=TESTDIST_TYPE_Right)
static double Get_Norm_Z(double P)
static double Get_T_Inverse(double alpha, int df, TSG_Test_Distribution_Type Type=TESTDIST_TYPE_Right)
void Add_Value(double Value, double Weight=1.)
virtual void Create(bool bWeights=false)
int Get_Class_Index(double Value) const
void Add_Value(const CSG_String &Value, double Weight=1.)
virtual void Create(bool bWeights=false)
int Get_Class_Index(const CSG_String &Value) const
virtual int Get_Minority(bool bWeighted=false) const
int Get_Count(void) const
virtual int Get_Majority(bool bWeighted=false) const
CSG_String to_String(int Width=-1, int Precision=-1, bool bScientific=false, const SG_Char *Separator=NULL) const
sLong Get_Size(void) const
double Get_Angle(const CSG_Vector &Vector) const
bool from_String(const CSG_String &String)
int SG_Compare_Version(const CSG_String &Version, int Major, int Minor, int Release)