• No results found

A Novel Variable Selection Method for Classification with Application to Single Nucleotide Polymorphism Data

N/A
N/A
Protected

Academic year: 2021

Share "A Novel Variable Selection Method for Classification with Application to Single Nucleotide Polymorphism Data"

Copied!
219
0
0

Loading.... (view fulltext now)

Full text

(1)
(2)
(3)
(4)
(5)
(6)
(7)
(8)
(9)
(10)
(11)
(12)
(13)
(14)
(15)
(16)
(17)

𝑋 𝑌 𝑝 𝑛 𝑛𝑔 𝑋𝑖 𝑖 𝑖 = 1,2, … , 𝑝 𝑋𝑖𝑗 𝑖 𝑗 𝑗 = 1,2, … , 𝑛 𝐷′/𝑟2 𝛽 𝜎2 𝜇 Ω 𝑘 𝑑 𝐺 = 0,1, … , 𝐺 − 1 𝑅 𝑟 = 1,2, … , 𝑅 𝑇 𝑡𝑟 = {𝑡𝑟,1, … , 𝑡𝑟,𝑛 𝑟} 𝑌𝑟 𝑦𝑟 = {𝑦𝑟,1, … , 𝑦𝑟,𝑛𝑟} 𝑌𝑆𝑁𝑃𝑖 𝑖 𝑖 = 1,2, … , 𝑝 𝑋𝑆𝑁𝑃𝑖 𝑖 𝑖 = 1,2, … , 𝑝 𝑏 𝑏 = (𝑏1, … , 𝑏𝑅) ∅𝑟 ℎ𝑟−1 𝑟

(18)

𝑥𝑟,𝑗 𝑟 𝑥𝑆𝑁𝑃𝑖,𝑗 𝑖 𝑧𝑟,𝑗 𝛼𝑟 𝑟 ℳ𝒱𝒩 𝔻 𝜔𝑞 𝑞 = 1,2, … , 𝑄 𝜑 𝜓 𝜃 𝑓 𝜋𝑔 𝕔 ℵ 𝔫 = 1,2, … , ℵ 𝐿1 𝐿2 𝜆

(19)

𝑋𝑖 𝑡 𝑖 𝑡 𝐹𝑠𝑡 𝑖 𝐹𝑠𝑡 𝐹 𝐾 = 3, 5

(20)
(21)

𝑋1, 𝑋2 𝑋3

(22)
(23)
(24)
(25)
(26)
(27)
(28)

𝑝

𝑛 (𝑝 ≫ 𝑛)

(29)
(30)
(31)

𝑡

𝑡

𝑡

(32)
(33)
(34)
(35)
(36)
(37)
(38)
(39)
(40)
(41)
(42)

𝜒2

𝑚11 𝑚12 𝑚13

(43)

𝑝 (𝑝 ≫ 𝑛)

(44)
(45)
(46)
(47)
(48)
(49)
(50)

𝑃𝑟(𝑌 = 1|𝑋) = 𝑒 𝛽0+𝛽𝑖𝑋𝑖 1 + 𝑒𝛽0+𝛽𝑖𝑋𝑖 𝛽0 𝛽1 𝑋𝑖 𝑋𝑖 𝑋𝑖, 𝑖 = 1,2, … , 𝑝

(51)

𝑋𝑖

(52)
(53)
(54)

𝑡 𝑖 𝑡 𝑔 = 0,1 𝑖 𝑡𝑖 = 𝑚𝑎𝑥 {|𝑋⃗̅𝑖𝑔− 𝑋⃗̅𝑖| 𝑀𝑔𝑆𝑖 , 𝑔 = 0,1, … , 𝐺 − 1} 𝑋⃗̅𝑖𝑔 𝑋⃗̅𝑖 𝑖 𝑔 |𝑋⃗̅𝑖𝑔− 𝑋⃗̅𝑖| 0 ⇒ 𝑋⃗𝑖(1)= {1,0,0}, ⇒ 𝑋⃗𝑖(2) = {0,1,0}, 0 ⇒ 𝑋⃗𝑖(3) = {0,0,1}. 𝑀𝑔 = √1 𝑛𝑔+ 1 𝑁 𝑆𝑖2 = 1 𝑁 − 𝐺∑ ∑ (𝑋⃗𝑖𝑗− 𝑋⃗̅𝑖𝑔) (𝑋⃗𝑖𝑗− 𝑋⃗̅𝑖𝑔) 𝑇 𝑗∈𝑔 𝐺−1 𝑔=0 𝑋⃗𝑖𝑗 𝑖 𝑗 𝑁 𝑛𝑔 𝑔 𝑆𝑖 𝑡

(55)

𝑝 𝑡 𝑡 𝑡 𝑖 𝑗 𝑛1= 1000 𝑋⃗̅𝑖1 𝑛0= 1000 𝑋⃗̅𝑖0 𝑁 = 2000 𝑋⃗̅𝑖 𝑆𝑖 𝑡 𝑡 𝑡

(56)

𝑡 𝑡 𝐹 𝑡 𝐹 (𝐹𝑠𝑡) 𝐹𝑠𝑡 = 𝑉𝑎𝑟𝑎 𝑎̅ ⋅ 𝑡̅ 𝑎̅ = ∑ 𝑎𝑔 1 𝑔=0 𝑉𝑎𝑟𝑎 = ∑(𝑎𝑔 − 𝑎̅) 2 2 1 𝑔=0 𝑎 𝑡 𝑎̅ 𝑡̅ 𝑉𝑎𝑟𝑎 𝑎𝑔 𝑔 𝐹𝑠𝑡

(57)

𝐹𝑠𝑡 𝑖 𝑗 𝑖 𝑎1 = 14 𝑡1= 543 𝑎0= 2 𝑡0 = 67 𝑁 = 2000 𝑎̅ = 16 𝑡̅ = 610 𝑉𝑎𝑟𝑎 𝑡 𝐹 𝐹

(58)
(59)
(60)
(61)
(62)

𝐿2 𝐿(𝛽0, 𝛽, 𝜆) = −𝑙(𝛽0, 𝛽) +𝜆 2 ‖𝛽‖2 2 𝑙 𝜆 𝜆 𝛽 glmnet 𝜆 𝜆 ‖𝛽‖2 𝐿2 ‖𝛽‖22 = ∑ 𝛽 𝑖2 𝑝 𝑖=1 𝛽 𝐿2 𝐿2 𝐿1

(63)

𝐿1

(64)
(65)

𝑌 = 𝑔 𝑋 = 𝑥 𝑃𝑟(𝑌 = 𝑔|𝑋 = 𝑥) =𝑃𝑟(𝑌 = 𝑔) × 𝑃𝑟(𝑋 = 𝑥|𝑌 = 𝑔) 𝑃𝑟(𝑋 = 𝑥) 𝑃𝑟(𝑌 = 𝑔) 𝑗 𝑔 𝑃𝑟(𝑋 = 𝑥) 𝑥 𝑃𝑟(𝑋 = 𝑥|𝑌 = 𝑔) 𝑋 𝑔 naïvebayes

(66)

𝑡 𝐹𝑠𝑡 𝑌 𝑋 𝑌 𝑋 𝐾 𝑥0 𝐾 𝑥0 𝑁0 𝑔 𝑔 𝑃𝑟(𝑌 = 𝑔|𝑋 = 𝑥0) = 1 𝐾∑𝑗∈𝑁0𝐼(𝑦𝑗 = 𝑔)

(67)

𝑥0 𝐾 = 1, 3, 5 class 𝐾 = 1 𝐾 = 3 𝐾 = 5 𝐾 𝐾 = 5 𝐾 = 3, 5 𝐾 = 3 𝐾 = 5 𝑡 𝐹𝑠𝑡

(68)

𝛽0+ 𝛽1𝑋1+ 𝛽2𝑋2 = 0 𝛽0, 𝛽1 𝛽2 𝑋 = (𝑋1, 𝑋2)𝑇 𝑝 𝛽0+ 𝛽1𝑋1+ 𝛽2𝑋2+ ⋯ + 𝛽𝑝𝑋𝑝= 0 𝑦𝑗 ∈ {0,1} 𝛽0+ 𝛽1𝑋𝑗1+ 𝛽2𝑋𝑗2+ ⋯ + 𝛽𝑝𝑋𝑝 > 𝑀 𝑦𝑗 = 1

(69)

𝛽0+ 𝛽1𝑋𝑗1+ 𝛽2𝑋𝑗2+ ⋯ + 𝛽𝑝𝑋𝑝 < 𝑀 𝑦𝑗 = 0 𝑗 = 1,2, … , 𝑛. 𝑀 e1071 = 𝑀 = 𝑡 𝐹𝑠𝑡

(70)

𝑔 𝑔 = 0,1 𝑝 𝑋𝑖 𝑝 𝑋1, 𝑋2, … , 𝑋𝑝 𝑗, 𝑗 = 1,2, … , 𝑛. 𝑋1 Ω Ω𝐿 Ω𝑅 Ω 𝑋1 (1) = {Ω𝐿 𝑖𝑓 𝑋𝑖 ∈ (0) Ω𝑅 𝑖𝑓 𝑋𝑖 ∈ (1,2) (2) = {Ω𝐿 𝑖𝑓 𝑋𝑖 ∈ (0,1) Ω𝑅 𝑖𝑓 𝑋𝑖 ∈ (2) (3) = {Ω𝐿 𝑖𝑓 𝑋𝑖 ∈ (0,2) Ω𝑅 𝑖𝑓 𝑋𝑖 ∈ (1) 𝑌 = 𝑔 𝑋2 Ω𝐿 𝑋3

(71)

Ω𝑅

𝑖(Ω) = 2𝑃𝑟Ω(1 − 𝑃𝑟Ω)

𝑃𝑟Ω Ω

rpart

(72)

(𝑌 = 0)

𝑡 𝐹𝑠𝑡

(73)

𝑲 = 𝟓 𝑡 𝐹𝑠𝑡 𝑲 = 𝟓 𝑡 𝐹𝑠𝑡 𝑲 = 𝟓 𝑡 𝐹𝑠𝑡 𝑲 = 𝟓 𝑡 𝐹𝑠𝑡

(74)

𝑡 𝐹

𝑡 𝐹

(75)
(76)
(77)
(78)
(79)
(80)

         

(81)

𝑆𝑁𝑅 =𝜎𝑠𝑖𝑔𝑛𝑎𝑙 2 𝜎𝑛𝑜𝑖𝑠𝑒2 𝜎𝑠𝑖𝑔𝑛𝑎𝑙2 𝜎𝑛𝑜𝑖𝑠𝑒2 𝑡 𝑡 𝑡 𝑡 𝑡 𝑡 𝑡 𝑝 𝐺 𝑡 𝑋𝑖 (𝑖 = 1,2, … , 𝑝) 𝑡

(82)

𝑡𝑖 = 𝑚𝑎𝑥 {|𝑋⃗̅𝑖𝑔− 𝑋⃗̅𝑖| 𝑀𝑔𝑆𝑖 , 𝑔 = 0,1, … , 𝐺 − 1} 𝑋⃗̅𝑖𝑔 𝑋⃗̅𝑖 𝑖 𝑔 𝑖 |𝑋⃗̅𝑖𝑔− 𝑋⃗̅𝑖| (0 ⇒ 𝑋⃗𝑖(1) = {1,0,0}, ⇒ 𝑋⃗𝑖(2) = {0,1,0}, 0 ⇒ 𝑋⃗𝑖(3)= {0,0,1}). 𝑀𝑔 = √1 𝑛𝑔+ 1 𝑁 𝑆𝑖2 = 1 𝑁 − 𝐺∑ ∑ (𝑋⃗𝑖𝑗− 𝑋⃗̅𝑖𝑔) (𝑋⃗𝑖𝑗− 𝑋⃗̅𝑖𝑔) 𝑇 𝑗∈𝑔 𝐺−1 𝑔=0 𝑋⃗𝑖𝑗 𝑖 𝑗 𝑁 𝑛𝑔 𝑔 𝑆𝑖 𝑡 𝑝 𝑡 𝑡

(83)

𝑡 𝑔( ) 𝑌 𝑋 𝑔(𝐸(𝑌|𝑋)) = 𝑋1𝛽1+ 𝑋2𝛽2 𝑋1𝛽1 𝑋2𝛽2 𝑋 = [𝑋1, 𝑋2] 𝛽 = (𝛽1, 𝛽2)𝑇 𝑋1 𝑛 × 𝑝1 𝑋2 𝑛 × 𝑝2 𝛽1 𝑝1× 1 𝛽2 𝑝2× 1 𝑝1+ 𝑝2 = 𝑝 𝛽̂𝑚𝑎𝑥 𝛽̂𝑚𝑎𝑥 ℒ(𝛽̂𝑚𝑎𝑥|𝑦) 𝛽̂ 𝛽 ℒ(𝛽̂|𝑦)

(84)

𝐷𝑒𝑣(𝑦, 𝑋, 𝛽̂) = −2 𝑙𝑜𝑔 ℒ(𝛽̂|𝑦) ℒ(𝛽̂𝑚𝑎𝑥|𝑦) 𝑆𝑁𝑅̂ =𝐷𝑒𝑣(𝑦, 𝑋1, 𝛽̂1) − 𝐷𝑒𝑣(𝑦, 𝑋, 𝛽̂) 𝐷𝑒𝑣(𝑦, 𝑋, 𝛽̂) 𝑋2 𝛽̂2 𝑋1 𝛽̂1 𝛽̂1 𝛽̂ 𝑌 𝑌 𝛽0 𝑋1 𝛽1 𝑋1𝛽1 𝑋𝑖 (𝑖 = 1,2, … , 𝑝)

(85)

𝑡𝑆𝑁𝑅̂𝑖 = 𝐷𝑒𝑣(𝑦, 𝛽̂0) − 𝐷𝑒𝑣(𝑦, 𝑋𝑖, 𝛽̂𝑖) 𝐷𝑒𝑣(𝑦, 𝑋𝑖, 𝛽̂𝑖) 𝐷𝑒𝑣(𝑦, 𝛽̂0) 𝛽̂0 𝐷𝑒𝑣(𝑦, 𝑋𝑖, 𝛽̂𝑖) 𝛽̂0 𝛽̂𝑖 𝑋𝑖 (𝑖 = 1,2, … , 𝑝) 𝑡𝑆𝑁𝑅̂ 𝑎𝑑𝑗𝑢𝑠𝑡𝑒𝑑 =𝐷𝑒𝑣(𝑦, 𝛽̂0) − 𝐷𝑒𝑣(𝑦, 𝑋𝑖, 𝛽̂𝑖) + 𝑑0− 𝑑𝑖 𝐷𝑒𝑣(𝑦, 𝑋𝑖, 𝛽̂𝑖) + 𝑑𝑖 𝑑0 𝑑𝑖

(86)
(87)
(88)
(89)

𝑌 𝑝 𝑋𝑖 (𝑖 = 1, 2, … , 𝑝) 𝐺 𝑔 = 0,1, … , 𝐺 − 1 𝐺 = 2, 𝑔 = 1 𝑔 = 0 𝑗 (𝑗 = 1,2, … , 𝑛) 𝑔 = 1 𝑖 𝑃𝑟(𝑌𝑗 = 1|𝑋𝑖) 𝑃𝑟(𝑌𝑗 = 1|𝑋𝑖) = 𝜋𝑗 = 𝑒𝛽0+𝑋𝑖𝑗𝑇𝛽𝑖 1 + 𝑒𝛽0+𝑋𝑖𝑗𝑇𝛽𝑖 𝑃𝑟(𝑌𝑗 = 0|𝑋𝑖) = 1 − 𝜋𝑗 = 1 1 + 𝑒𝛽0+𝑋𝑖𝑗𝑇𝛽𝑖 𝑋𝑖𝑗 𝑖 𝑗 𝜃 = (𝛽0, 𝛽1, … , 𝛽𝑝) 𝑇

(90)

𝐿(𝜃) = ∑[𝑌𝑗 𝑙𝑜𝑔 𝜋𝑗+ (1 − 𝑌𝑗)𝑙𝑜𝑔(1 − 𝜋𝑗)] 𝑛 𝑗=1 𝑔(𝜃) = 𝐿(𝜃) − 𝜆 ∑|𝛽𝑖| 𝑝 𝑖=1 𝛽0 𝜆 ∑𝑝𝑖=1|𝛽𝑖| 𝜆 𝛽𝑖 glmnet 𝑘 𝑘

(91)

𝑘 𝑘 𝑘 𝜔𝑖 𝑘 𝜔𝑖 = ∑ 𝑡𝑆𝑁𝑅̂ 100 𝑘=1 𝑘 𝑘 𝛽𝑖

(92)
(93)

𝑆𝑒𝑛𝑠𝑖𝑡𝑖𝑣𝑖𝑡𝑦 = 𝑇𝑃 𝑇𝑃+𝐹𝑁 𝑆𝑝𝑒𝑐𝑖𝑓𝑖𝑐𝑖𝑡𝑦 = 𝑇𝑁 𝑇𝑁+𝐹𝑃 𝑃𝐶𝐶 = 𝑇𝑃 + 𝑇𝑁 𝑇𝑃 + 𝐹𝑁 + 𝑇𝑁 + 𝐹𝑃

(94)

𝑃𝑃𝑉 = 𝑇𝑃

𝑇𝑃+𝐹𝑃 𝑁𝑃𝑉 =

𝑇𝑁 𝑇𝑁+𝐹𝑁

(95)

𝐴𝐼𝐶 = 𝐷𝑒𝑣(𝑦, 𝑋𝑖, 𝛽̂𝑖) + 2𝑑𝑖 𝑑𝑖 𝑡𝑆𝑁𝑅̂ = 𝐷𝑒𝑣(𝑦, 𝛽̂0) 𝐷𝑒𝑣(𝑦, 𝑋𝑖, 𝛽̂𝑖) − 1 𝑡𝑆𝑁𝑅̂ =𝐷𝑒𝑣(𝑦, 𝛽̂0) 𝐴𝐼𝐶 − 2𝑑𝑖 − 1 𝑛

(96)

𝐵𝐼𝐶 = 𝐷𝑒𝑣(𝑦, 𝑋𝑖, 𝛽̂𝑖) + 𝑑 𝑙𝑜𝑔(𝑛)

𝑡𝑆𝑁𝑅̂ = 𝐷𝑒𝑣(𝑦, 𝛽̂0)

𝐵𝐼𝐶 − 𝑑 𝑙𝑜𝑔(𝑛)− 1

𝑅2 = 1 −𝐷𝑒𝑣(𝑦, 𝑋𝑖, 𝛽̂𝑖) 𝐷𝑒𝑣(𝑦, 𝛽̂0)

(97)
(98)
(99)
(100)

𝐺 𝐺 = 2, 𝑔 = 1 𝑔 = 0 𝑇. 𝑅 ≥ 1 𝑡𝑟 = (𝑡𝑟,1, … , 𝑡𝑟,𝑛𝑟) 𝑡𝑟,1< ⋯ < 𝑡𝑟,𝑛𝑟 𝑟 = 1, … , 𝑅 𝑅 𝑌𝑟 = (𝑌𝑟,1, … , 𝑌𝑟,𝑛𝑟) 𝑡 < 𝑇 𝑔 𝑡 𝑔 = 0 𝑔 = 1 𝑗 (𝑗 = 1, … , 𝑛𝑟) 𝑟 (𝑟 = 1, … , 𝑅) 𝑌𝑟,𝑗𝑟𝑔 {ℎ𝑟−1{𝐸(𝑌 𝑟,𝑗|𝑏, 𝑔)} = 𝑥𝑟,𝑗 𝑔𝑇 𝛼𝑟𝑔 + 𝑧𝑟,𝑗𝑔𝑇𝑏𝑟, 𝑟 = 1, … , 𝑅, 𝑗 = 1, … , 𝑛𝑟.

(101)

ℎ𝑟−1 𝑟 𝑥𝑟,𝑗𝑔 𝑧𝑟,𝑗𝑔 𝑔 𝛼𝑟𝑔 𝑟 𝑔 𝑏 = (𝑏1, … , 𝑏𝑅) 𝑏, 𝑔~ ∑ 𝜔𝑞𝑔 𝑄𝑔 𝑞=1 ℳ𝒱𝒩(𝜇𝑞𝑔, 𝔻𝑞𝑔), ℳ𝒱𝒩(𝜇, 𝔻) 𝜇 𝔻 𝜔𝑞, (𝑞 = 1, … , 𝑄) 𝑄𝑔 𝜑(∙; 𝜇, 𝔻) 𝜓𝑔: = (𝛼1𝑔, … , 𝛼𝑅𝑔, ∅1𝑔, … , ∅𝑅𝑔) 𝜃𝑔: =

(102)

(𝜔𝑔, 𝜇1𝑔, … , 𝜇𝑄𝑔𝑔, 𝔻1𝑔, … , 𝔻𝑄𝑔𝑔) 𝑌𝑟 𝑌𝑆𝑁𝑃𝑖, (𝑖 = 1,2, … 𝑝) 𝑌𝑆𝑁𝑃𝑖 𝑌𝑆𝑁𝑃𝑖1 𝑌𝑆𝑁𝑃𝑖2 𝑌𝑆𝑁𝑃1 𝑌𝑆𝑁𝑃1 𝑌𝑆𝑁𝑃11 𝑌𝑆𝑁𝑃12

(103)

𝑥𝑟,𝑗𝑔 {ℎ𝑟 −1{𝐸(𝑌 𝑟,𝑗|𝑏, 𝑔)} = 𝑥𝑟,𝑗 𝑔𝑇 𝛼𝑟𝑔+ 𝑧𝑟,𝑗𝑔𝑇𝑏𝑟, 𝑟 = 1, … , 𝑅, 𝑗 = 1, … , 𝑛𝑟 ℎ𝑆𝑁𝑃−1 𝑖{𝐸(𝑌𝑆𝑁𝑃𝑖,𝑗|𝑔)} = 𝑥𝑆𝑁𝑃𝑖,𝑗 𝑔𝑇 𝛼𝑆𝑁𝑃 𝑖 𝑔 , 𝑖 = 1, … , 𝑝, 𝑗 = 1, … , 𝑛𝑆𝑁𝑃𝑖 𝑅 𝑥𝑟,𝑗𝑔𝑇 = (𝑥𝑟,𝑗𝑔𝑇, 𝑋𝑆𝑁𝑃 𝑖,𝑗 𝑔𝑇 , … , 𝑋𝑆𝑁𝑃 𝑝,𝑗 𝑔𝑇 ).

(104)

𝑋𝑆𝑁𝑃 11,𝑗 𝑔 𝑋𝑆𝑁𝑃 12,𝑗 𝑔 𝜓𝑔 𝜃𝑔 𝑔 𝑃𝑟𝑔,𝑛𝑒𝑤 = 𝜋𝑔𝑓̂𝑔,𝑛𝑒𝑤 ∑𝐺−1𝑔̌=0𝜋𝑔̃𝑓̂𝑔̃,𝑛𝑒𝑤 𝑔 = 0, … , 𝐺 − 1, 𝑓̂ 𝜋𝑔 = 𝑃𝑟(𝑔), 𝑔 = 0, … , 𝐺 − 1 𝑓𝑔,𝑛𝑒𝑤

(105)

ℵ 𝑓𝑔,𝑛𝑒𝑤 𝑓𝑔,𝑛𝑒𝑤 𝑌𝑛𝑒𝑤 = (𝑦𝑛𝑒𝑤,1, … , 𝑦𝑛𝑒𝑤,𝑅) 𝑓𝑔,𝑛𝑒𝑤 𝑌𝑛𝑒𝑤 𝑓𝑔,𝑛𝑒𝑤 𝑌𝑛𝑒𝑤 𝑓𝑔,𝑛𝑒𝑤

(106)

𝑔 = 0 𝑔 = 1

(107)
(108)
(109)
(110)
(111)

glm

(112)
(113)

glmnet

(114)
(115)
(116)

0 50 100 150 200 0 .0 0 .2 0 .4 0 .6 0 .8 1 .0

Number of SNPs in the model based on univariate tSNR ranking

C la s s if ic a ti o n p e rf o rm a n c e PCC AUC NPV PPV Sensitivity Specificity

(117)
(118)
(119)
(120)
(121)
(122)

0 50 100 150 200 0 .0 0 .2 0 .4 0 .6 0 .8 1 .0

Number of SNPs in the model based on cumulative tSNR ranking

C la s s if ic a ti o n p e rf o rm a n c e PCC AUC NPV PPV Sensitivity Specificity

(123)
(124)
(125)
(126)
(127)
(128)
(129)
(130)
(131)
(132)
(133)
(134)
(135)

𝑋𝑖 , 𝑖 = 1,2, … , 𝑝 𝑡𝑆𝑁𝑅̂𝑖 𝑡𝑆𝑁𝑅̂𝑖 = 𝐷𝑒𝑣(𝑦, 𝛽̂0) − 𝐷𝑒𝑣(𝑦, 𝑋𝑖, 𝛽̂𝑖) 𝐷𝑒𝑣(𝑦, 𝑋𝑖, 𝛽̂𝑖) 𝐷𝑒𝑣(𝑦, 𝛽̂0) 𝛽̂0 𝐷𝑒𝑣(𝑦, 𝑋𝑖, 𝛽̂𝑖) 𝛽̂0 𝛽̂𝑖 𝑖 𝑋𝑖 (𝑖 = 1,2, … , 𝑝)

(136)
(137)

n = 1,212

n = 303 𝑘

(138)

𝜔𝑖 𝑘 𝜔𝑖 = ∑ 𝑡𝑆𝑁𝑅̂ 100 𝑘=1 𝑋1, 𝑋2 𝑋3 𝑘 𝑋1 𝑋2 𝑋3 𝑋1+ 𝑋2+ 𝑋3 𝑋1 𝑋1+ 𝑋2 𝑋2+ 𝑋3 𝜔𝑖 𝜔1 𝜔2 𝜔3

(139)

𝑡𝑆𝑁𝑅̂ 𝑎𝑑𝑗𝑢𝑠𝑡𝑒𝑑 =𝐷𝑒𝑣(𝑦, 𝛽̂0) − 𝐷𝑒𝑣(𝑦, 𝑋𝑖, 𝛽̂𝑖) + 𝑑0− 𝑑𝑖 𝐷𝑒𝑣(𝑦, 𝑋𝑖, 𝛽̂𝑖) + 𝑑𝑖 𝑑0 𝑑𝑖 𝑘 𝑘 𝛽𝑖

(140)
(141)
(142)
(143)
(144)

0 10 20 30 40 50 0 .0 0 .2 0 .4 0 .6 0 .8 1 .0

Number of SNPs in the model based on univariate tSNR ranking

C la s s if ic a ti o n p e rf o rm a n c e PCC AUC NPV PPV Sensitivity Specificity 0 10 20 30 40 50 0 .0 0 .2 0 .4 0 .6 0 .8 1 .0

Number of SNPs in the model based on univariate tSNR ranking

C la s s if ic a ti o n p e rf o rm a n c e PCC AUC NPV PPV Sensitivity Specificity

(145)

glmnet

𝜆

(146)
(147)

0 10 20 30 40 50 0 .0 0 .2 0 .4 0 .6 0 .8 1 .0

Number of SNPs in the model based on cumulative tSNR ranking

C la s s ifi c a tio n p e rf o rm a n c e PCC AUC NPV PPV Sensitivity Specificity

(148)

0 50 100 150 200 0 .0 0 .2 0 .4 0 .6 0 .8 1 .0

Number of SNPs in the model based on cumulative tSNR ranking

C la s s if ic a ti o n p e rf o rm a n c e PCC AUC NPV PPV Sensitivity Specificity 0 50 100 150 200 0 1 2 3 4 5

Number of SNPs in the model based on cumulative tSNR ranking

A d ju s te d t S N R

(149)
(150)
(151)
(152)

(𝑛 = 639) (𝑛 = 1,515)

(153)
(154)
(155)
(156)
(157)
(158)
(159)
(160)

           

(161)
(162)
(163)
(164)
(165)

0 500 1000 1500 0 .0 0 .2 0 .4 0 .6 0 .8 1 .0 Time (days) S e iz u re s Remission 0 500 1000 1500 0 2 4 6 8 10 Time (days) lo g (1 + T o ta l S e iz u re s ) Remission 0 500 1000 1500 0 1 2 3 4 5 6 Time (days) N u m b e r o f A d v e rs e E v e n ts Remission 0 500 1000 1500 0 .0 0 .2 0 .4 0 .6 0 .8 1 .0 Time (days) S e iz u re s Refractory 0 500 1000 1500 0 2 4 6 8 10 Time (days) lo g (1 + T o ta l S e iz u re s ) Refractory 0 500 1000 1500 0 1 2 3 4 5 Time (days) N u m b e r o f A d v e rs e E v e n ts Refractory

(166)

mixAK 𝑗 (𝑗 = 1, … , 𝑛𝑟) 𝑟 (𝑟 = 1, … , 𝑅) 𝑌𝑟,𝑗 𝑔 𝑏 ∅𝑟𝑔 ℎ𝑟−1{𝐸(𝑌𝑟,𝑗|𝑏, 𝑈 = 𝑔)} = 𝑥𝑟,𝑗𝑔𝑇𝛼𝑟𝑔 + 𝑧𝑟,𝑗𝑔𝑇𝑏𝑟 𝑟 = 1, … , 𝑅, 𝑗 = 1, … , 𝑛𝑟 𝑅 = 3 𝐸(𝑌1,𝑗|𝑏, 𝑈 = 1) = ℎ1−1(𝑥1,𝑗 𝑔𝑇 𝛼1𝑔+ 𝑧1,𝑗𝑔𝑇𝑏1) 𝐸(𝑌2,𝑗|𝑏, 𝑈 = 1) = ℎ2−1(𝑥2,𝑗𝑔𝑇𝛼2𝑔+ 𝑧2,𝑗𝑔𝑇𝑏2) 𝐸(𝑌3,𝑗|𝑏, 𝑈 = 1) = ℎ3−1(𝑥 3,𝑗 𝑔𝑇 𝛼3𝑔+ 𝑧3,𝑗𝑔𝑇𝑏3) 𝐸(𝑌1,𝑗|𝑏, 𝑈 = 0) = ℎ1−1(𝑥1,𝑗𝑔𝑇𝛼1𝑔+ 𝑧1,𝑗𝑔𝑇𝑏1) 𝐸(𝑌2,𝑗|𝑏, 𝑈 = 0) = ℎ2−1(𝑥 2,𝑗 𝑔𝑇 𝛼2𝑔+ 𝑧2,𝑗𝑔𝑇𝑏2) 𝐸(𝑌3,𝑗|𝑏, 𝑈 = 0) = ℎ3−1(𝑥3,𝑗𝑔𝑇𝛼3𝑔+ 𝑧3,𝑗𝑔𝑇𝑏3) 𝑥𝑟,𝑗𝑔

(167)

𝑧𝑟,𝑗𝑔 = 1 𝑏 = (𝑏1, 𝑏2, 𝑏3)𝑇 𝑔 𝑃𝑟𝑔,𝑛𝑒𝑤 = 𝜋𝑔𝑓̂𝑔,𝑛𝑒𝑤 ∑𝐺−1𝑔̌=0𝜋𝑔̃𝑓̂𝑔̃,𝑛𝑒𝑤 𝑔 = 0, … , 𝐺 − 1, 𝑓̂ 𝜋𝑔 = 𝑃𝑟(𝑔), 𝑔 = 0, … , 𝐺 − 1 𝑓𝑔,𝑛𝑒𝑤 ℵ coda 𝛼𝑟𝑔 ∅𝑟𝑔 𝑓𝑔,𝑛𝑒𝑤

(168)

𝑌𝑛𝑒𝑤 = (𝑦𝑛𝑒𝑤,1, … , 𝑦𝑛𝑒𝑤,𝑅) 𝑓𝑔,𝑛𝑒𝑤 𝑌𝑛𝑒𝑤 𝑏𝑛𝑒𝑤 𝕔 𝕔 𝑌𝑟

(169)

𝑋𝑟 𝑌𝑆𝑁𝑃1 𝑌𝑆𝑁𝑃2 {ℎ𝑟 −1{𝐸(𝑌 𝑟,𝑗|𝑏, 𝑔)} = 𝑥𝑟,𝑗 𝑔𝑇 𝛼𝑟𝑔+ 𝑧𝑟,𝑗𝑔𝑇𝑏𝑟, 𝑟 = 1, … , 𝑅, 𝑗 = 1, … , 𝑛𝑟𝑆𝑁𝑃−1 𝑖{𝐸(𝑌𝑆𝑁𝑃𝑖,𝑗|𝑔)} = 𝑥𝑆𝑁𝑃 𝑖,𝑗 𝑔𝑇 𝛼𝑆𝑁𝑃 𝑖 𝑔 , 𝑖 = 1, … , 𝑝, 𝑗 = 1, … , 𝑛𝑆𝑁𝑃𝑖 𝑋𝑆𝑁𝑃1 𝑋𝑆𝑁𝑃2 𝑅 𝑥𝑟,𝑗𝑔𝑇 = (𝑥𝑟,𝑗𝑔𝑇, 𝑋𝑆𝑁𝑃 𝑖,𝑗 𝑔𝑇 , … , 𝑋𝑆𝑁𝑃 𝑝,𝑗 𝑔𝑇 ).

(170)

𝑌𝑆𝑁𝑃𝑖 𝑋𝑆𝑁𝑃𝑖

(171)
(172)
(173)
(174)
(175)

0 50 100 150 0 .0 0 .2 0 .4 0 .6 0 .8 1 .0

Number of SNPs in the model based on weightage ranking

C la s s ifi c a tio n p e rf o rm a n c e PCC AUC NPV PPV Sensitivity Specificity

(176)

0 50 100 150 0 .0 0 .2 0 .4 0 .6 0 .8 1 .0

Number of SNPs in the model based on weightage ranking

C la s s ifi c a tio n p e rf o rm a n c e 0 1 2 3 4 5 6 A d ju s te d t S N R 0 50 100 150 0 .0 0 .2 0 .4 0 .6 0 .8 1 .0

Number of SNPs in the model based on weightage ranking

C la s s if ic a ti o n p e rf o rm a n c e PCC AUC NPV PPV Sensitivity Specificity

(177)
(178)
(179)

𝑌𝑆𝑁𝑃1 𝑌𝑆𝑁𝑃2 𝑋𝑆𝑁𝑃1 𝑋𝑆𝑁𝑃2 𝑋𝑆𝑁𝑃1 + 𝑋𝑆𝑁𝑃2 𝑌𝑆𝑁𝑃1 𝑌𝑆𝑁𝑃2 𝑌𝑆𝑁𝑃1 + 𝑌𝑆𝑁𝑃2 𝑌𝑆𝑁𝑃1 𝑌𝑆𝑁𝑃1+ 𝑌𝑆𝑁𝑃2 𝑋𝑆𝑁𝑃1+ 𝑋𝑆𝑁𝑃2

(180)

𝑥𝑆𝑁𝑃1 𝑥𝑆𝑁𝑃2 + 𝑥𝑥𝑆𝑁𝑃1

𝑆𝑁𝑃2

𝑌𝑆𝑁𝑃1 𝑌𝑆𝑁𝑃2 + 𝑌𝑌𝑆𝑁𝑃1

𝑆𝑁𝑃2

(181)

𝑌𝑆𝑁𝑃1 𝑌𝑆𝑁𝑃2

𝑌𝑆𝑁𝑃1 + 𝑌𝑆𝑁𝑃2

(182)
(183)
(184)
(185)
(186)
(187)
(188)
(189)
(190)
(191)
(192)
(193)
(194)
(195)
(196)
(197)
(198)
(199)
(200)

References

Related documents

interviews confirmed the results drawn from the questionnaire study: the students mostly depended on books as primary source of knowledge, liked peer discussion, mind

Sahin and Chamkha [15] analyzed the effects of radiation and chemical reaction on steady mixed convective heat and mass transfer flow of an optically thin gray gas

identify and exclude deaths potentially attributable to neonatal tetanus or congenital malformations (con- firmed through direct physician [Drs Adhikari and Kha- try] assessment

CUAJ ? Review Danielson et al Management of non metastatic prostate cancer Management algorithms for prostate specific antigen progression in prostate cancer Biochemical recurrence

Int J D , mu\ ~O 557 566 (19961 557 Original Arliel,' Activation of an 85 kDa ribosomal 56 kinase during serotonin induced oocyte maturation YVES DUROCHER' and PIERRE GUERRIER Ecole

 Perform uncertainty quantification analysis for ring gyroscope based on output response. statistics in time domain as well as in the frequency domain for varying

controlled, multicenter, multinational Phase II study, Traverso et al assessed the duration and stability of the IOP-lowering effect and tolerability of