#r "nuget: FSharpAux, 1.1.0"
#r "nuget: Plotly.NET.Interactive, 4.0.0"
#r "nuget: FSharp.Stats, 0.4.11"
open Plotly.NET
open Plotly.NET.StyleParam
open Plotly.NET.LayoutObjects
module Chart =
let myAxis name = LinearAxis.init(Title=Title.init name,Mirror=StyleParam.Mirror.All,Ticks=StyleParam.TickOptions.Inside,ShowGrid=false,ShowLine=true)
let withAxisTitles x y chart =
chart
|> Chart.withTemplate ChartTemplates.lightMirrored
|> Chart.withXAxis (myAxis x)
|> Chart.withYAxis (myAxis y)
High-throughput techniques like microarrays, their successor RNA-Seq, and mass spectrometry based proteomics generate huge amounts of data. Thousands of features (e.g. transcripts or proteins) are measured simultaneously. Differential expression analysis aims to identify features that change significantly between two conditions. A common experimental setup is the analysis of which genes are over- or underexpressed between e.g. a wild type and a mutant.
Hypothesis tests aim to identify differences between two or more samples. The most common statistical test is the t test, which tests for a difference of means. Hypothesis tests report a p value, which corresponds to the probability of obtaining results at least as extreme as those observed, assuming that the null hypothesis is correct. In other words:
If there is no effect (no mean difference), a p value threshold of 0.05 means that a false positive is reported in 5 % of the tests.
Consider two population distributions that follow a normal distribution. Both have the same mean and standard deviation.
open FSharpAux
open FSharp.Stats
let distributionA = Distributions.ContinuousDistribution.normal 10.0 1.0
let distributionB = Distributions.ContinuousDistribution.normal 10.0 1.0
[
Chart.Area([5. .. 0.01 .. 15.] |> List.map (fun x -> x,distributionA.PDF x),Name = "distA")
Chart.Area([5. .. 0.01 .. 15.] |> List.map (fun x -> x,distributionB.PDF x),Name = "distB")
]
|> Chart.combine
|> Chart.withAxisTitles "variable X" "relative count"
|> Chart.withSize (900.,600.)
|> Chart.withTitle "null hypothesis"
Samples of size 5 are randomly drawn from both population distributions.
Both samples are tested for a mean difference using a two-sample t test, assuming equal variances of the underlying population distributions.
let getSample n (dist: Distributions.ContinuousDistribution<float,float>) =
Vector.init n (fun _ -> dist.Sample())
let sampleA = getSample 5 distributionA
let sampleB = getSample 5 distributionB
(Testing.TTest.twoSample true sampleA sampleB).PValue
0.760894895653307
Fig 1: p value distribution of the null hypothesis.
10,000 tests are performed, each with newly drawn random samples. This corresponds to an experiment in which none of the features changed. Note that the mean intensities are arbitrary and do not have to be the same for all features! In the presented case, all feature intensities average 10. The same simulation can be performed with pairwise comparisons from distributions that differ between features but are the same within each feature. The resulting p values are uniformly distributed between 0 and 1.
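A minimal sketch of this simulation (the binding name nullPValues and the loop structure are assumptions, not part of the original script):

let nullPValues =
    Array.init 10000 (fun _ ->
        // draw fresh samples from the two identical null distributions and test them
        let a = getSample 5 distributionA
        let b = getSample 5 distributionB
        (Testing.TTest.twoSample true a b).PValue
    )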
Samples are called significantly different if their p value is below a certain significance threshold ($\alpha$ level). While "the lower the better", a common threshold is a p value of 0.05 or 0.01. In the presented case, on average $10,000 \times 0.05 = 500$ tests are significant (red box), even though the populations do not differ. They are called false positives (FP). Now let's repeat the same experiment, but this time sample 70 % of the time from null features (no difference) and add 30 % samples of truly differing distributions. Therefore, a third population is generated that differs in mean but has an equal standard deviation:
let distributionC = Distributions.ContinuousDistribution.normal 11.5 1.0
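The mixed experiment can be sketched accordingly (again with assumed names): 7,000 of the 10,000 comparisons are drawn from null features (A vs. B), the remaining 3,000 from truly differing features (A vs. C).

let mixedPValues =
    Array.init 10000 (fun i ->
        let a = getSample 5 distributionA
        let other =
            if i < 7000 then getSample 5 distributionB // null comparison
            else getSample 5 distributionC             // truly differing comparison
        (Testing.TTest.twoSample true a other).PValue
    )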
Fig 2: p value distribution of the alternative hypothesis. Blue coloring indicates p values deriving from distributions A and B (null). Orange coloring indicates p values deriving from distributions A and C (truly differing).
The p value distribution of the tests resulting from truly differing populations is right skewed, while the null tests again show a uniform distribution between 0 and 1. Many, but not all, of the tests that derive from the truly differing populations are below 0.05 and would therefore be reported as significant. On average, 350 tests are reported as significant even though they derive from null features (blue bars, 10,000 x 0.7 x 0.05 = 350).
The hypothesis testing framework with the p value definition given above was developed for performing just one test. If many tests are performed, as in modern high-throughput studies, the probability of obtaining a false positive result increases. The probability of at least one false positive is called the familywise error rate (FWER) and can be determined by $FWER=1-(1-\alpha)^m$, where $\alpha$ corresponds to the significance threshold (here 0.05) and $m$ is the number of performed tests.
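As a quick sanity check, the formula can be transcribed directly (fwer is an assumed helper name, not part of the original script):

// probability of at least one false positive among m tests at threshold alpha
let fwer alpha m = 1. - (1. - alpha) ** float m
fwer 0.05 10  // ≈ 0.40
fwer 0.05 100 // ≈ 0.99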
let bonferroniLine =
Shape.init(
ShapeType = ShapeType.Line,
X0 = 0.,
X1 = 35.,
Y0 = 0.05,
Y1 = 0.05,
Line=Line.init(Dash=DrawingStyle.Dash)
)
[1..35]
|> List.map (fun x ->
x,(1. - (1. - 0.05)**(float x))
)
|> Chart.Point
|> Chart.withYAxisStyle("",MinMax=(0.,1.))
|> Chart.withAxisTitles "#tests" "p(at least one FP)"
|> Chart.withShape bonferroniLine
|> Chart.withTitle "FWER"
Fig 3: Familywise error rate depending on the number of performed tests. The black dashed line indicates the Bonferroni-corrected FWER with $p^* = \frac{\alpha}{m}$.
When 10,000 null features are tested with a p value threshold of 0.05, on average 500 tests are reported as significant even if there is not a single comparison in which the populations differ. If some of the features are in fact different, the number of false positives consequently decreases (remember, the p value is defined for tests of null features).
Why the interpretation of high-throughput data based on p values is difficult: the more features are measured, the more false positives you can expect. If 100 differentially expressed genes are identified by p value thresholding, this result is useless without further information about the magnitude of expected changes and the total number of measured transcripts.
The p value threshold has no straightforward interpretation when many tests are performed. Of course, you could restrict the familywise error rate to 0.05, regardless of how many tests are performed. This is realized by dividing the $\alpha$ significance threshold by the number of tests, which is known as Bonferroni correction: $p^* = \frac{\alpha}{m}$. This correction drastically limits the false positive rate, but in an experiment with a large number of expected changes it additionally results in many false negatives. The FWER should be controlled if follow-up studies of the candidates are costly, or if studying false positives would waste excessive time.
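A minimal worked example of the Bonferroni threshold (binding names are assumptions; values taken from the simulation above):

let alphaFWER     = 0.05
let numberOfTests = 10000.
// only p values below this corrected threshold are called significant
let pStar = alphaFWER / numberOfTests // 5e-6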
A more reasonable measure of significance with a simple interpretation is the so-called false discovery rate (FDR). It describes the expected proportion of false positives among all features reported as significant. The goal is to identify as many significant features as possible while incurring a relatively low proportion of false positives. Consequently, a set of reported significant features together with the FDR describes the confidence of this set, without the requirement to somehow incorporate the uncertainty that is introduced by the total number of tests performed. In the simulated case above of 7,000 null tests and 3,000 tests resulting from truly differing distributions, the FDR can be calculated exactly: at e.g. a p value threshold of 0.05, the number of false positives (blue in red box) is divided by the number of tests reported as significant (false positives + true positives).
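For the simulation above this works out as follows (a sketch; the count of 2019 significant tests is taken from the text below):

let expectedFalsePositives = 10000. * 0.7 * 0.05 // ≈ 350 FP expected from the 7,000 null features
let reportedSignificant    = 2019.               // tests with p <= 0.05 in this simulation
let exactFDR = expectedFalsePositives / reportedSignificant // ≈ 0.173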
Fig 4: p value distribution of the alternative hypothesis.
Given the conditions described in the first chapter, the FDR of this experiment with a p value threshold of 0.05 is 0.173. Of the 2019 comparisons reported as significant, on average 350 are expected to be false positives, which gives a straightforward interpretation of the data confidence. In real-world experiments, the proportion of null tests and tests deriving from an actual difference is of course unknown. The p values of null tests, however, tend to be uniformly distributed in the p value histogram. By identifying this average null frequency, the proportions of FP and TP can be determined and the FDR can be defined. This frequency estimate is called $\pi_0$, which leads to the FDR definition:

$$\hat{FDR}(p) = \frac{\hat \pi_0 \, m \, p}{\#[p_j \leq p]}$$
Fig 5: FDR calculation on simulated data.
Consequently, a corresponding FDR can be calculated for each p value. The minimum FDR at or above each p value is called its q value.

$$\hat q(p_i) = \min_{t \geq p_i} \hat{FDR}(t)$$

Since the raw FDR is not necessarily monotonically increasing in p, it is smoothed by assigning to each p value the lowest FDR of all p values that are equal to or greater than the current one.
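The smoothing step can be sketched as a running minimum over (p value, FDR) pairs sorted by descending p value (an assumed helper; the implementation applied to the example data follows further below):

let smoothQValues (pFdrSortedDesc: (float * float)[]) =
    let mutable lowest = 1.0
    pFdrSortedDesc
    |> Array.map (fun (p, fdr) ->
        // assign the lowest FDR of all p values equal to or greater than p
        lowest <- min lowest fdr
        p, lowest)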
By defining $\pi_0$, all other parameters can be calculated from the given p value distribution to determine all q values. The most prominent FDR-controlling method is the Benjamini-Hochberg correction. It sets $\pi_0$ to 1, assuming that all features are null. In studies with an expectedly high proportion of true positives, a $\pi_0$ of 1 is too conservative, since there definitely are true positives in the data.
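Since $\pi_0 = 1$ is just a special case of the q value calculation, the Benjamini-Hochberg correction can be expressed with the same function that is used later in this article (the input p values here are hypothetical):

// q values with pi0 fixed at 1.0 correspond to the Benjamini-Hochberg correction
let somePVals = [|0.001; 0.01; 0.02; 0.2; 0.5; 0.9|]
let qValuesBH = Testing.MultipleTesting.Qvalues.ofPValues 1.0 somePVals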
A better estimation of $\pi_0$ is given in the following:
True positives are assumed to show a right-skewed p value distribution, while the p values of null tests are uniformly distributed between 0 and 1. Consequently, the flat right region of the p value histogram tends to correspond to the true frequency of null comparisons (Fig 5). As a real-world example, 9856 genes were measured in triplicate under two conditions (control and treatment). The p value distribution of the two-sample t tests looks as follows:
let examplePVals =
System.IO.File.ReadAllLines(@"../../files/pvalExample.txt")
|> Array.tail
|> Array.map float
//number of tests
let m =
examplePVals
|> Array.length
|> float
let nullLine =
Shape.init(
ShapeType = ShapeType.Line,
X0 = 0.,
X1 = 1.,
Y0 = 1.,
Y1 = 1.,
Line=Line.init(Dash=DrawingStyle.Dash)
)
let empLine =
Shape.init(
ShapeType = ShapeType.Line,
X0 = 0.,
X1 = 1.,
Y0 = 0.4,
Y1 = 0.4,
Line=Line.init(Dash=DrawingStyle.DashDot,Color=Color.fromHex "#FC3E36")
)
[
[
examplePVals
|> Distributions.Frequency.create 0.025
|> Map.toArray
|> Array.map (fun (k,c) -> k,float c / (m * 0.025))
|> Chart.Column
|> Chart.withTraceInfo "density"
|> Chart.withAxisTitles "p value" "density"
|> Chart.withShapes [nullLine;empLine]
examplePVals
|> Distributions.Frequency.create 0.025
|> Map.toArray
|> Array.map (fun (k,c) -> k,float c)
|> Chart.Column
|> Chart.withTraceInfo "gene count"
|> Chart.withAxisTitles "p value" "gene count"
]
]
|> Chart.Grid()
|> Chart.withSize(1100.,550.)
Fig 6: p value distribution of the real-world example. The frequency is given on the right, its density on the left. The black dashed line indicates the expected distribution if all features were null. The red dash-dotted line indicates the visually estimated $\pi_0$.
By performing t tests for all comparisons, 3743 (38 %) of the genes lead to a p value lower than 0.05. By eye, you would estimate $\pi_0$ as 0.4, indicating that only 40 % of the genes are unaltered (null). After the q value calculation, you would filter for a specific FDR (e.g. 0.05) and end up with a p value threshold of 0.04613, indicating an FDR of at most 0.05 within the 3642 finally reported genes.
pi0    = 0.4
m      = 9856
D(p)   = number of significant tests at p value threshold p
FP(p)  = p * 0.4 * 9856
FDR(p) = FP(p) / D(p)
FDR(0.04613) = (0.04613 * 0.4 * 9856) / 3642 ≈ 0.0499
let pi0 = 0.4
let getD p =
examplePVals
|> Array.sumBy (fun x -> if x <= p then 1. else 0.)
let getFP p = p * pi0 * m
let getFDR p = (getFP p) / (getD p)
let qvaluesNotSmoothed =
examplePVals
|> Array.sort
|> Array.map (fun x ->
x, getFDR x)
|> Chart.Line
|> Chart.withTraceInfo "not smoothed"
let qvaluesSmoothed =
let pValsSorted =
examplePVals
|> Array.sortDescending
let rec loop i lowest acc =
if i = pValsSorted.Length then
acc |> List.rev
else
let p = pValsSorted.[i]
let q = getFDR p
if q > lowest then
loop (i+1) lowest ((p,lowest)::acc)
else loop (i+1) q ((p,q)::acc)
loop 0 1. []
|> Chart.Line
|> Chart.withTraceInfo "smoothed"
let eXpos = examplePVals |> Array.filter (fun x -> x <= 0.046135) |> Array.length
[qvaluesNotSmoothed;qvaluesSmoothed]
|> Chart.combine
|> Chart.withYAxisStyle("",MinMax=(0.,1.))
|> Chart.withAxisTitles "p value" "q value"
|> Chart.withShape empLine
|> Chart.withTitle (sprintf "#[genes with q value < 0.05] = %i" eXpos)
Fig 7: FDR calculation on experiment data. Please zoom into the very first part of the curve to inspect the monotonicity.
The automatic estimation of $\pi_0$ works as follows:
For a range of $\lambda$, e.g. $\{0.0 .. 0.05 .. 0.95\}$, calculate $\hat \pi_0 (\lambda) = \frac {\#[p_j > \lambda]}{m(1 - \lambda)}$.
let pi0Est =
[|0. .. 0.05 .. 0.95|]
|> Array.map (fun lambda ->
let num =
examplePVals
|> Array.sumBy (fun x -> if x > lambda then 1. else 0.)
let den = float examplePVals.Length * (1. - lambda)
lambda, num/den
)
pi0Est
|> Chart.Point
|> Chart.withYAxisStyle("",MinMax=(0.,1.))
|> Chart.withXAxisStyle("",MinMax=(0.,1.))
|> Chart.withAxisTitles "$\lambda$" "$\hat \pi_0(\lambda)$"
|> Chart.withMathTex(true)
|> Chart.withConfig(
Config.init(
Responsive=true,
ModeBarButtonsToAdd=[
ModeBarButton.DrawLine
ModeBarButton.DrawOpenPath
ModeBarButton.EraseShape
]
)
)
Fig 8: pi0 estimation.
The resulting diagram shows that with increasing $\lambda$, the estimate $\hat \pi_0(\lambda)$ tends towards $\pi_0$. The calculation relates the observed proportion of p values greater than $\lambda$ to the proportion expected there if all tests were null, namely $1 - \lambda$. In Storey & Tibshirani (2003) this curve is fitted with a cubic spline; a weighting of the knots by $(1 - \lambda)$ is recommended, but not specified in the final publication. Afterwards, the fitted value at $\lambda = 1$, i.e. $\hat \pi_0(1)$, is taken as the final estimator of $\pi_0$. This is often referred to as the smoother method.
Another method that does not depend on fitting is the bootstrap method, introduced in Storey et al. (2004). It is implemented in FSharp.Stats:
let getpi0Bootstrap (lambda:float[]) (pValues:float[]) =
    let rnd = System.Random()
    let m = pValues.Length |> float
    // pi0 estimate at a given lambda for one sample of p values
    let getpi0hat lambda pVals =
        let hits =
            pVals
            |> Array.sumBy (fun x -> if x > lambda then 1. else 0.)
        hits / (m * (1. - lambda))
    // generate 100 bootstrap samples of the p values and calculate
    // the pi0 estimate of each sample at the given lambda
    let getBootstrapPi0s lambda =
        Array.init 100 (fun _ ->
            Array.sampleWithReplacement rnd pValues pValues.Length
            |> getpi0hat lambda
        )
    lambda
    |> Array.map (fun l -> l, getBootstrapPi0s l)
let minimalpihat =
//FSharp.Stats.Testing.MultipleTesting.Qvalues.pi0hats [|0. .. 0.05 .. 0.96|] examplePVals |> Array.minBy snd |> snd
0.3686417749
let minpiHatShape =
Shape.init(
ShapeType = ShapeType.Line,
X0 = 0.,
X1 = 1.,
Y0 = minimalpihat,
Y1 = minimalpihat,
Line=Line.init(Dash=DrawingStyle.Dash)
)
getpi0Bootstrap [|0. .. 0.05 .. 0.95|] examplePVals
|> Array.map (fun (l,x) ->
Chart.BoxPlot(X=Array.init x.Length (fun _ -> l),Y=x,FillColor=Color.fromHex"#1F77B4",MarkerColor=Color.fromHex"#1F77B4",Name=sprintf "%.2f" l))
|> Chart.combine
|> Chart.withYAxisStyle("",MinMax=(0.,1.))
|> Chart.withAxisTitles "$\lambda$" "$\hat \pi_0$"
|> Chart.withMathTex(true)
|> Chart.withShape minpiHatShape
|> Chart.withConfig(
Config.init(
Responsive=true,
ModeBarButtonsToAdd=[
ModeBarButton.DrawLine
ModeBarButton.DrawOpenPath
ModeBarButton.EraseShape
]
)
)
Fig 9: Bootstrapping for pi0 estimation. The dashed line indicates the minimal pi0 from Fig 8. The bootstrapped pi0 distribution that shows the least deviation from the dashed line is optimal. In the presented example it is either 0.8 or 0.85.
For a $\lambda$ range of $\{0.0 .. 0.05 .. 0.95\}$, the bootstrap method determines either 0.8 or 0.85 as the optimal $\lambda$, and therefore the optimal $\hat \pi_0$ is either $0.3703$ or $0.3686$.
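The selection step can be sketched as follows, assuming the criterion of Storey et al. (2004): minimize the mean squared deviation of the bootstrapped $\hat \pi_0$ values from the minimal $\hat \pi_0$ (the binding optimalLambda is not part of the original script):

let optimalLambda =
    getpi0Bootstrap [|0. .. 0.05 .. 0.95|] examplePVals
    |> Array.minBy (fun (_, bootstrapped) ->
        // mean squared deviation from the minimal pi0hat of Fig 8
        bootstrapped |> Array.averageBy (fun pi0hat -> (pi0hat - minimalpihat) ** 2.))
    |> fst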
The automated estimation of $\pi_0$ based on bootstrapping is implemented in FSharp.Stats.Testing.MultipleTesting.Qvalues.
open Testing.MultipleTesting
let pi0Stats = Qvalues.pi0BootstrapWithLambda [|0.0 .. 0.05 .. 0.95|] examplePVals
pi0Stats
0.3703327922077925
Subsequent to the $\pi_0$ estimation, the q values can be determined from the list of p values.
let qValues = Qvalues.ofPValues pi0Stats examplePVals
// show the first 5 q values
qValues.[0..4] |> Array.map string |> String.concat "; "
0.2690343536429767; 0.03451771894511998; 0.260005815044248; 0.2984261021835806; 0.08590835637088742
A robust variant of the q value determination exists that is more conservative for small p values when the total number of p values is low. Here, the number of false positives is divided by the number of total discoveries multiplied by the FWER at the current p value. This correction takes into account the probability of a false positive being reported in the first place. Especially when the population distributions do not follow a perfect normal distribution, or the p value distribution looks strange, the usage of the robust version is recommended.
$$qval = \frac{\#FP}{\#Discoveries} \\ qval_{robust} = \frac{\#FP}{\#Discoveries \times (1-(1-p)^m)}$$

let qvaluesRobust =
Testing.MultipleTesting.Qvalues.ofPValuesRobust pi0Stats examplePVals
[
Chart.Line(Array.sortBy fst (Array.zip examplePVals qValues),Name="qValue")
Chart.Line(Array.sortBy fst (Array.zip examplePVals qvaluesRobust),Name="qValueRobust")
]
|> Chart.combine
|> Chart.withAxisTitles "p value" "q value"
Fig 10: Comparison of q values and robust q values; the latter are more conservative at low p values.
let pi0Line =
Shape.init(
ShapeType = ShapeType.Line,
X0 = 0.,
X1 = 1.,
Y0 = pi0Stats,
Y1 = pi0Stats,
Line=Line.init(Dash=DrawingStyle.Dash)
)
// relates the q value to each p value
Array.zip examplePVals qValues
|> Array.sortBy fst
|> Chart.Line
|> Chart.withShape pi0Line
|> Chart.withAxisTitles "p value" "q value"
Fig 11: p value relation to q values. At a p value of 1 the q value is equal to pi0 (black dashed line).
let frequencyBins = 0.025
let m = examplePVals.Length |> float
examplePVals
|> Distributions.Frequency.create frequencyBins
|> Map.toArray
|> Array.map (fun (k,c) -> k,float c / frequencyBins / m)
|> Chart.StackedColumn
|> Chart.withTraceInfo "p values"
|> Chart.withAxisTitles "p value" "frequency density"
|> Chart.withShape pi0Line
Fig 12: p value density distribution. The dashed line indicates pi0 estimated by Storey's bootstrapping method.
// shows pi0 estimation in relation to lambda
//Testing.MultipleTesting.Qvalues.pi0hats [|0. .. 0.05 .. 0.96|] examplePVals
[|0. .. 0.05 .. 0.95|]
|> Array.map (fun lambda ->
let num =
examplePVals
|> Array.sumBy (fun x -> if x > lambda then 1. else 0.)
let den = float examplePVals.Length * (1. - lambda)
lambda, num/den
)
|> Chart.Point
|> Chart.withAxisTitles @"$\lambda$" "$\hat \pi_0(\lambda)$"
|> Chart.withMathTex(true)
Fig 13: Visual pi0 estimation.
Which cutoff should I use?
In my study, gene RBCM has a q value of 0.03. Does that indicate there is a 3 % chance that it is a false positive?