% 1. Title: Pima Indians Diabetes Database
% 
% 2. Sources:
%    (a) Original owners: National Institute of Diabetes and Digestive and
%                         Kidney Diseases
%    (b) Donor of database: Vincent Sigillito (vgs@aplcen.apl.jhu.edu)
%                           Research Center, RMI Group Leader
%                           Applied Physics Laboratory
%                           The Johns Hopkins University
%                           Johns Hopkins Road
%                           Laurel, MD 20707
%                           (301) 953-6231
%    (c) Date received: 9 May 1990
% 
% 3. Past Usage:
%     1. Smith,~J.~W., Everhart,~J.~E., Dickson,~W.~C., Knowler,~W.~C., \&
%        Johannes,~R.~S. (1988). Using the ADAP learning algorithm to forecast
%        the onset of diabetes mellitus.  In {\it Proceedings of the Symposium
%        on Computer Applications and Medical Care} (pp. 261--265).  IEEE
%        Computer Society Press.
% 
%        The diagnostic, binary-valued variable investigated is whether the
%        patient shows signs of diabetes according to World Health Organization
%        criteria (i.e., if the 2 hour post-load plasma glucose was at least 
%        200 mg/dl at any survey  examination or if found during routine medical
%        care).   The population lives near Phoenix, Arizona, USA.
% 
%        Results: Their ADAP algorithm makes a real-valued prediction between
%        0 and 1.  This was transformed into a binary decision using a cutoff of 
%        0.448.  Using 576 training instances, the sensitivity and specificity
%        of their algorithm was 76% on the remaining 192 instances.
% 
% 4. Relevant Information:
%       Several constraints were placed on the selection of these instances from
%       a larger database.  In particular, all patients here are females at
%       least 21 years old of Pima Indian heritage.  ADAP is an adaptive learning
%       routine that generates and executes digital analogs of perceptron-like
%       devices.  It is a unique algorithm; see the paper for details.
% 
% 5. Number of Instances: 768
% 
% 6. Number of Attributes: 8 plus class 
% 
% 7. For Each Attribute: (all numeric-valued)
%    1. Number of times pregnant
%    2. Plasma glucose concentration a 2 hours in an oral glucose tolerance test
%    3. Diastolic blood pressure (mm Hg)
%    4. Triceps skin fold thickness (mm)
%    5. 2-Hour serum insulin (mu U/ml)
%    6. Body mass index (weight in kg/(height in m)^2)
%    7. Diabetes pedigree function
%    8. Age (years)
%    9. Class variable (0 or 1)
% 
% 8. Missing Attribute Values: None
% 
% 9. Class Distribution: (class value 1 is interpreted as "tested positive for
%    diabetes")
% 
%    Class Value  Number of instances
%    0            500
%    1            268
% 
% 10. Brief statistical analysis:
% 
%     Attribute number:    Mean:   Standard Deviation:
%     1.                     3.8     3.4
%     2.                   120.9    32.0
%     3.                    69.1    19.4
%     4.                    20.5    16.0
%     5.                    79.8   115.2
%     6.                    32.0     7.9
%     7.                     0.5     0.3
%     8.                    33.2    11.8
% 
% 
%
%
%
%
% Relabeled values in attribute 'class'
%    From: 0                       To: tested_negative     
%    From: 1                       To: tested_positive     
%
@relation pima_diabetes
@attribute 'preg' real
@attribute 'plas' real
@attribute 'pres' real
@attribute 'skin' real
@attribute 'insu' real
@attribute 'mass' real
@attribute 'pedi' real
@attribute 'age' real
@attribute 'class' {tested_negative,tested_positive}
@data
3,173,78,39,185,33.8,0.97,31,tested_positive
9,165,88,0,0,30.4,0.302,49,tested_positive
13,152,90,33,29,26.8,0.731,43,tested_positive
8,120,86,0,0,28.4,0.259,22,tested_positive
0,135,68,42,250,42.3,0.365,24,tested_positive
7,129,68,49,125,38.5,0.439,43,tested_positive
3,187,70,22,200,36.4,0.408,36,tested_positive
4,136,70,0,0,31.2,1.182,22,tested_positive
3,128,72,25,190,32.4,0.549,27,tested_positive
0,138,0,0,0,36.3,0.933,25,tested_positive
7,147,76,0,0,39.4,0.257,43,tested_positive
1,117,88,24,145,34.5,0.403,40,tested_positive
4,145,82,18,0,32.5,0.235,70,tested_positive
0,109,88,30,0,32.5,0.855,38,tested_positive
7,196,90,0,0,39.8,0.451,41,tested_positive
4,148,60,27,318,30.9,0.15,29,tested_positive
8,186,90,35,225,34.5,0.423,37,tested_positive
12,92,62,7,258,27.6,0.926,44,tested_positive
1,199,76,43,0,42.9,1.394,22,tested_positive
0,162,76,36,0,49.6,0.364,26,tested_positive
2,146,0,0,0,27.5,0.24,28,tested_positive
0,121,66,30,165,34.3,0.203,33,tested_positive
1,115,70,30,96,34.6,0.529,32,tested_positive
6,0,68,41,0,39,0.727,41,tested_positive
1,180,0,0,0,43.3,0.282,41,tested_positive
4,134,72,0,0,23.8,0.277,60,tested_positive
1,126,56,29,152,28.7,0.801,21,tested_negative
2,88,74,19,53,29,0.229,22,tested_negative
1,136,74,50,204,37.4,0.399,24,tested_negative
4,117,64,27,120,33.2,0.23,24,tested_negative
1,0,68,35,0,32,0.389,22,tested_negative
2,96,68,13,49,21.1,0.647,26,tested_negative
0,114,80,34,285,44.2,0.167,27,tested_negative
3,125,58,0,0,31.6,0.151,24,tested_negative
0,111,65,0,0,24.6,0.66,31,tested_negative
2,94,76,18,66,31.6,0.649,23,tested_negative
6,144,72,27,228,33.9,0.255,40,tested_negative
5,88,78,30,0,27.6,0.258,37,tested_negative
5,44,62,0,0,25,0.587,36,tested_negative
7,83,78,26,71,29.3,0.767,36,tested_negative
3,124,80,33,130,33.2,0.305,26,tested_negative
11,138,76,0,0,33.2,0.42,35,tested_negative
1,0,74,20,23,27.7,0.299,21,tested_negative
0,101,64,17,0,21,0.252,21,tested_negative
3,120,70,30,135,42.9,0.452,30,tested_negative
0,95,64,39,105,44.6,0.366,22,tested_negative
9,154,78,30,100,30.9,0.164,45,tested_negative
4,144,58,28,140,29.5,0.287,37,tested_negative
10,92,62,0,0,25.9,0.167,31,tested_negative
0,93,60,0,0,35.3,0.263,25,tested_negative
4,189,110,31,0,28.5,0.68,37,tested_negative
5,143,78,0,0,45,0.19,47,tested_negative
1,107,72,30,82,30.8,0.821,24,tested_negative
0,74,52,10,36,27.8,0.269,22,tested_negative
1,80,55,0,0,19.1,0.258,21,tested_negative
2,99,0,0,0,22.2,0.108,23,tested_negative
5,132,80,0,0,26.8,0.186,69,tested_negative
1,109,56,21,135,25.2,0.833,23,tested_negative
2,122,60,18,106,29.8,0.717,22,tested_negative
6,137,61,0,0,24.2,0.151,55,tested_negative
0,129,80,0,0,31.2,0.703,29,tested_negative
9,106,52,0,0,31.2,0.38,42,tested_negative
2,92,76,20,0,24.2,1.698,28,tested_negative
4,131,68,21,166,33.1,0.16,28,tested_negative
1,121,78,39,74,39,0.261,28,tested_negative
9,57,80,37,0,32.8,0.096,41,tested_negative
4,83,86,19,0,29.3,0.317,34,tested_negative
0,78,88,29,40,36.9,0.434,21,tested_negative
3,87,60,18,0,21.8,0.444,21,tested_negative
1,96,64,27,87,33.2,0.289,21,tested_negative
0,119,64,18,92,34.9,0.725,23,tested_negative
4,84,90,23,56,39.5,0.159,25,tested_negative
3,103,72,30,152,27.6,0.73,27,tested_negative
0,161,50,0,0,21.9,0.254,65,tested_negative
2,141,58,34,128,25.4,0.699,24,tested_negative
2,56,56,28,45,24.2,0.332,22,tested_negative
