> ### Tea Tasting ####
> ### Fisher's Exact test a quick solution in R###
> ### More details on this example corresponding to SAS output ###
> ##########################################
> 
> ### Fisher's Exact test a quick solution in R with output ###
> # data entry 
> 
> tea<- matrix(c(3, 1, 1, 3), ncol= 2, dimnames = list(Truth = c("Tea","Milk" ),Lady_says = c("Tea first","Milk first")))
> 
> # one-sided Fisher's exact test
> fisher.test(tea, alternative = "greater")

	Fisher's Exact Test for Count Data

data:  tea 
p-value = 0.2429
alternative hypothesis: true odds ratio is greater than 1 
95 percent confidence interval:
 0.3135693       Inf 
sample estimates:
odds ratio 
  6.408309 

> 
> # two-sided Fisher's exact test
> fisher.test(tea)

	Fisher's Exact Test for Count Data

data:  tea 
p-value = 0.4857
alternative hypothesis: true odds ratio is not equal to 1 
95 percent confidence interval:
   0.2117329 621.9337505 
sample estimates:
odds ratio 
  6.408309 

> 
> #######OUTPUT for one-sided test #########
> #Fisher's Exact Test for Count Data
> #
> #data:  tea 
> #p-value = 0.2429
> #alternative hypothesis: true odds ratio is greater than 1 
> #95 percent confidence interval:
> # 0.3135693       Inf 
> #sample estimates:
> #odds ratio 
> # 6.408309 
> 
> ######## CONCLUSION ########
> # We cannot reject the null hypothesis (one-sided p-value = 0.2429 > 0.05); that is, there is not enough evidence to establish an association
> 
> ###### What is the conclusion for two-sided test? ##############
> 
> ################################################################
> #### Another approach ##########################################
> TeaLady=matrix(c(3, 1, 1, 3), ncol=2, dimnames=list(Poured=c("tea", "milk"), Lady=c("tea", "milk")))
> TeaLady
      Lady
Poured tea milk
  tea    3    1
  milk   1    3
> 
> ### Pearson's Chi-squared test  with Yates' continuity correction
> 
> result=chisq.test(TeaLady)
Warning message:
In chisq.test(TeaLady) : Chi-squared approximation may be incorrect
> result

	Pearson's Chi-squared test with Yates' continuity correction

data:  TeaLady 
X-squared = 0.5, df = 1, p-value = 0.4795

> 
> ### Let's look at the observed, expected values and the residuals
> result$observed
      Lady
Poured tea milk
  tea    3    1
  milk   1    3
> result$expected
      Lady
Poured tea milk
  tea    2    2
  milk   2    2
> result$residuals
      Lady
Poured        tea       milk
  tea   0.7071068 -0.7071068
  milk -0.7071068  0.7071068
> 
> 
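> ### Let us look at the Percentage, Row Percentage and Column Percentage 
> ### of the total observations contained in each cell.
> ### (prop.table returns proportions between 0 and 1; multiply by 100 for percentages.
> ### The results are only stored here; type Contingency_Table to display them.)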
> 
> Contingency_Table=list(Frequency=TeaLady,Expected=result$expected,Percentage=prop.table(TeaLady),RowPercentage=prop.table(TeaLady,1),ColPercentage=prop.table(TeaLady,2))
> 
> ### Pearson's Chi-squared test  withOUT Yates' continuity correction
> result=chisq.test(TeaLady, correct=FALSE)
Warning message:
In chisq.test(TeaLady, correct = FALSE) :
  Chi-squared approximation may be incorrect
> result

	Pearson's Chi-squared test

data:  TeaLady 
X-squared = 2, df = 1, p-value = 0.1573

> result$observed
      Lady
Poured tea milk
  tea    3    1
  milk   1    3
> result$expected
      Lady
Poured tea milk
  tea    2    2
  milk   2    2
> result$residuals
      Lady
Poured        tea       milk
  tea   0.7071068 -0.7071068
  milk -0.7071068  0.7071068
> 
> ### Likelihood Ratio Chi-Squared Statistic
> ### G^2 = 2*sum(observed*log(observed/expected)), using the expected counts in result$expected
> ### An empty cell contributes 0; it is guarded explicitly because 0*log(0) evaluates to NaN in R
> LR=2*sum(ifelse(TeaLady>0,TeaLady*log(TeaLady/result$expected),0))
> LR
[1] 2.092993
> ### p-value for the Likelihood Ratio Test
> ### The upper tail is requested directly, which avoids the rounding loss of 1-pchisq() for very small p-values
> LRchisq=pchisq(LR,df=1,lower.tail=FALSE)
> LRchisq
[1] 0.1479760
> 
> ### Fisher's Exact Test
> Fisher_Exact_TwoSided=fisher.test(TeaLady,alternative = "two.sided")
> Fisher_Exact_Less=fisher.test(TeaLady,alternative = "less")
> Fisher_Exact_Greater=fisher.test(TeaLady,alternative = "greater")
> list(Fisher_Exact_TwoSided=Fisher_Exact_TwoSided,Fisher_Exact_Less=Fisher_Exact_Less,Fisher_Exact_Greater=Fisher_Exact_Greater)
$Fisher_Exact_TwoSided

	Fisher's Exact Test for Count Data

data:  TeaLady 
p-value = 0.4857
alternative hypothesis: true odds ratio is not equal to 1 
95 percent confidence interval:
   0.2117329 621.9337505 
sample estimates:
odds ratio 
  6.408309 


$Fisher_Exact_Less

	Fisher's Exact Test for Count Data

data:  TeaLady 
p-value = 0.9857
alternative hypothesis: true odds ratio is less than 1 
95 percent confidence interval:
   0.0000 306.2469 
sample estimates:
odds ratio 
  6.408309 


$Fisher_Exact_Greater

	Fisher's Exact Test for Count Data

data:  TeaLady 
p-value = 0.2429
alternative hypothesis: true odds ratio is greater than 1 
95 percent confidence interval:
 0.3135693       Inf 
sample estimates:
odds ratio 
  6.408309 


> 
> RowSums=rowSums(TeaLady)
> ColSums=colSums(TeaLady)
> ### Column 1 Risk Estimates
> 
> risk1_col1=TeaLady[1,1]/RowSums[1]
> risk2_col1=TeaLady[2,1]/RowSums[2]
> rho1=risk1_col1/risk2_col1
> total1=ColSums[1]/sum(RowSums)
> diff1=risk1_col1-risk2_col1
> list(Row1_Risk=risk1_col1,Row2_Risk=risk2_col1,Total=total1,difference=diff1)
$Row1_Risk
 tea 
0.75 

$Row2_Risk
milk 
0.25 

$Total
tea 
0.5 

$difference
tea 
0.5 

> 
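> ### The confidence interval for the difference in proportions for column 1
> ### (Wald interval; with only 4 observations per row the normal approximation is crude,
> ### which is why the upper limit shown below exceeds 1)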
> 
> SE_diff1=sqrt(risk1_col1*(1-risk1_col1)/RowSums[1]+risk2_col1*(1-risk2_col1)/RowSums[2])
> CI_diff1=cbind(diff1-qnorm(0.975)*SE_diff1,diff1+qnorm(0.975)*SE_diff1)
> SE_diff1
      tea 
0.3061862 
> CI_diff1
          [,1]     [,2]
tea -0.1001140 1.100114
> 
> ### Column 2 Risk Estimates
> 
> ### Proportion of each row falling in column 2, the overall column 2 proportion,
> ### and the difference between the two row proportions
> risk1_col2=TeaLady[1,2]/RowSums[1]
> risk2_col2=TeaLady[2,2]/RowSums[2]
> total2=ColSums[2]/sum(RowSums)
> diff2=risk1_col2-risk2_col2
> list(Row1_Risk=risk1_col2,Row2_Risk=risk2_col2,Total=total2,difference=diff2)
$Row1_Risk
 tea 
0.25 

$Row2_Risk
milk 
0.75 

$Total
milk 
 0.5 

$difference
 tea 
-0.5 

> 
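> ### The confidence interval for the difference in proportions for column 2
> ### (Wald interval; with only 4 observations per row the normal approximation is crude,
> ### which is why the lower limit shown below falls below -1)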
> 
> SE_diff2=sqrt(risk1_col2*(1-risk1_col2)/RowSums[1]+risk2_col2*(1-risk2_col2)/RowSums[2])
> CI_diff2=cbind(diff2-qnorm(0.975)*SE_diff2,diff2+qnorm(0.975)*SE_diff2)
> SE_diff2
      tea 
0.3061862 
> CI_diff2
         [,1]      [,2]
tea -1.100114 0.1001140
> 
> ### Estimate of the Odds of the two rows
> ### (within each row: count in column 1 divided by count in column 2)
> 
> odds1=TeaLady[1,1]/TeaLady[1,2]
> odds2=TeaLady[2,1]/TeaLady[2,2]
> odds1
[1] 3
> odds2
[1] 0.3333333
> ### Odds Ratio (odds of row 1 relative to odds of row 2)
> oddsratio=odds1/odds2
> oddsratio
[1] 9
> 
> ### Confidence Interval of the odds ratio
> ### Wald interval built on the log scale and then exponentiated;
> ### the standard error of log(oddsratio) is sqrt of the sum of reciprocal cell counts
> log_CI=cbind(log(oddsratio)-qnorm(0.975)*sqrt(sum(1/TeaLady)),log(oddsratio)+qnorm(0.975)*sqrt(sum(1/TeaLady)))
> CI_oddsratio=exp(log_CI)
> CI_oddsratio
          [,1]    [,2]
[1,] 0.3666369 220.927
> 
>