From a2fec9c87d8a687f88744b46261d10e447ef882d Mon Sep 17 00:00:00 2001 From: corentinchoisy Date: Mon, 25 Mar 2024 13:32:51 +0100 Subject: [PATCH] Split ROSALI analysis in 20 files --- .../scénarios/pcm_dif_rosali_S1.do | 364 ++++++++++++++++++ .../scénarios/pcm_dif_rosali_S10.do | 364 ++++++++++++++++++ .../scénarios/pcm_dif_rosali_S11.do | 364 ++++++++++++++++++ .../scénarios/pcm_dif_rosali_S12.do | 364 ++++++++++++++++++ .../scénarios/pcm_dif_rosali_S13.do | 364 ++++++++++++++++++ .../scénarios/pcm_dif_rosali_S14.do | 364 ++++++++++++++++++ .../scénarios/pcm_dif_rosali_S15.do | 364 ++++++++++++++++++ .../scénarios/pcm_dif_rosali_S16.do | 364 ++++++++++++++++++ .../scénarios/pcm_dif_rosali_S17.do | 364 ++++++++++++++++++ .../scénarios/pcm_dif_rosali_S18.do | 364 ++++++++++++++++++ .../scénarios/pcm_dif_rosali_S19.do | 364 ++++++++++++++++++ .../scénarios/pcm_dif_rosali_S2.do | 364 ++++++++++++++++++ .../scénarios/pcm_dif_rosali_S20.do | 364 ++++++++++++++++++ .../scénarios/pcm_dif_rosali_S3.do | 364 ++++++++++++++++++ .../scénarios/pcm_dif_rosali_S4.do | 364 ++++++++++++++++++ .../scénarios/pcm_dif_rosali_S5.do | 364 ++++++++++++++++++ .../scénarios/pcm_dif_rosali_S6.do | 364 ++++++++++++++++++ .../scénarios/pcm_dif_rosali_S7.do | 364 ++++++++++++++++++ .../scénarios/pcm_dif_rosali_S8.do | 364 ++++++++++++++++++ .../scénarios/pcm_dif_rosali_S9.do | 364 ++++++++++++++++++ 20 files changed, 7280 insertions(+) create mode 100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S1.do create mode 100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S10.do create mode 100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S11.do create mode 100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S12.do create mode 100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S13.do create mode 100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S14.do create mode 100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S15.do create mode 
100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S16.do create mode 100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S17.do create mode 100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S18.do create mode 100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S19.do create mode 100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S2.do create mode 100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S20.do create mode 100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S3.do create mode 100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S4.do create mode 100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S5.do create mode 100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S6.do create mode 100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S7.do create mode 100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S8.do create mode 100644 Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S9.do diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S1.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S1.do new file mode 100644 index 0000000..564b235 --- /dev/null +++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S1.do @@ -0,0 +1,364 @@ +*================================================================================================================================================= +* Date : 2024-01-23 +* Stata version : Stata 18 SE +* +* This program analyses simulated data accounting for DIF through a partial credit model +* +* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea) +* +* +*================================================================================================================================================ +adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom" + + +local N = "50 100 200 300" + local ss = "1" + foreach s in `ss' { + foreach Nnn in `N' { + 
local Nn = `Nnn'
+            local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'"
+            if (`s'<=4) {
+                local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'"
+            }
+            local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'"
+            local scenarios = "A B C D E F G"
+            foreach scen in `scenarios' {
+                clear
+                import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear
+                rename TT tt
+                * nbitems: 4 items for scenarios 1-2 and 5-12, 7 items for scenarios 3-4 and 13 onwards
+                if (`s'<=2) {
+                    local nbitems=4
+                }
+                else if (`s'<=4) {
+                    local nbitems=7
+                }
+                else if (`s'<=12) {
+                    local nbitems=4
+                }
+                else {
+                    local nbitems=7
+                }
+                * nbmoda: 3 for even-numbered scenarios, 1 for odd-numbered scenarios
+if (mod(`s',2)==0) {
+    local nbmoda=3
+}
+else {
+    local nbmoda=1
+}
+                * nbdif: 0 for scenarios 1-4, 1 for scenarios 5-8, 2 for scenarios 9-16, 3 above 16
+                if (`s'<=4) {
+                    local nbdif=0
+                }
+                else if (`s'<=8) {
+                    local nbdif=1
+                }
+                else if (`s'<=16) {
+                    local nbdif=2
+                }
+                else {
+                    local nbdif=3
+                }
+                * taillemat = at most J*M cells for the item parameters and J*M cells for the DIF parameters + J cells for the detected DIF items + nbdif cells for the real DIF items (+ 2 for beta and se_beta)
+                local taillemat=2*`nbitems'*`nbmoda'+`nbitems'+`nbdif'+2
+                local colna=""
+                forvalues i=1/`nbitems' {
+                    forvalues z=1/`nbmoda' {
+                        local colna = "`colna'"+"item`i'_`z' "
+                        local colna = "`colna'"+"dif_`i'_`z' "
+                    }
+                }
+                forvalues i=1/`nbitems' {
+                    local colna = "`colna'"+"dif_detect_`i' "
+                }
+                * One real_dif column per DIF item counted by nbdif
+                forvalues i=1/`nbdif' {
+                    local colna = "`colna'"+"real_dif_`i' "
+                }
+local colna = "`colna'" + "beta " + "se_beta"
+
+                * Results matrix: 1000 rows and taillemat columns, all initialised to missing
+                mat outmat = J(1000,`taillemat',.)
+                mat colnames outmat= `colna'
+                di "Scenario `s'`scen' / N=`Nnn'"
+                forvalues k=1/1000 {
+                    if (mod(`k',100)==0) {
+                        di "`k'/1000"
+                    }
+                    preserve // the full dataset is restored at the end of each replication
+                    qui keep if replication==`k'
+                    * The category merging below only runs when nbmoda>1 and N=50
+                    * A category of an item with no observation in at least one tt group is recoded to another category of that item
+                    * MERGE response categories that are not represented
+                    * comz is set to 1 as soon as one such empty category is found
+                    if (`nbmoda'>1 & `Nn'==50) {
+                        local com_z = 0
+                        qui gen comz = 0
+                        forvalues j = 1 / `nbitems' {
+                            local recoda_`j' = 0
+                            qui tab item`j' if tt == 0, matrow(rect1_g0_`j') matcell(nbrt1_g0_`j')
+                            local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1]
+                            local minm`j'_t1_g0 = rect1_g0_`j'[1,1]
+                            * Same tabulation for the tt==1 group
+                            qui tab item`j' if tt == 1, matrow(rect1_g1_`j') matcell(nbrt1_g1_`j')
+                            local minm`j'_t1_g1 = rect1_g1_`j'[1,1]
+                            local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1]
+                            * Lowest and highest observed category over both groups; nbm_j is their difference
+                            local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1')
+                            local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1')
+                            local nbm_`j' = `=`maxm_`j''-`minm_`j'''
+                            * com_z becomes 1 once the lowest observed category of some item is not 0
+                            if `minm_`j'' != 0 & `com_z' == 0 {
+                                local com_z = 1
+                            }
+                            * Category 3 absent from at least one group: flag comz
+                            qui count if item`j' == 3 & tt == 0
+                            local mod3plac = r(N)
+                            qui count if item`j' == 3 & tt == 1
+                            local mod3tt = r(N)
+                            local nb_rn3 = min(`mod3plac',`mod3tt')
+                            if `nb_rn3'==0 {
+                                qui replace comz = 1
+                            }
+                            * Scan categories 0 to nbm_j-1 and recode those that are empty in at least one group
+                            forvalues m = 0/`=`nbm_`j''-1' {
+                                qui count if item`j' == `m' & tt == 0
+                                local nb_rn1_g0 = r(N)
+                                qui count if item`j' == `m' & tt == 1
+                                local nb_rn1_g1 = r(N)
+                                local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1')
+                                if `nb_rn' == 0 {
+                                    qui replace comz = 1
+                                    local recoda_`j' = 1
+                                    if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' {
+                                        local stop = 1 // search upward (m+1, m+2, ...) for the first category observed in either group
+                                        forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                            local v`kk'1_0 = r(N)
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                            local v`kk'1_1 = r(N)
+                                            if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                                qui replace item`j'= `=`m'+`kk'' if item`j'==`m'
+                                                local zzz=`j'+`nbitems'
+                                                *qui replace item`zzz'=`=`m'+`kk'' if item``=`j'+`nbitems'''==`m'
+                                                *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                local stop = 0
+                                            }
+                                        }
+                                    }
+                                    else if `m' == `=`nbm_`j''-1' | `m' >= `maxm`j'_t1_g1' {
+                                        local stop = 1 // search downward (m-1, m-2, ...) for the first category observed in either group
+                                        forvalues kk = 1/`=`m'' {
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                            local v`kk'1_0 = r(N)
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                            local v`kk'1_1 = r(N)
+                                            if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                                qui replace item`j'= `=`m' - `kk'' if item`j'==`m'
+                                                local zzz=`j'+`nbitems'
+                                                *qui replace item`zzz'= `=`m' - `kk'' if item`zzz'==`m'
+                                                *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                local stop = 0
+                                            }
+                                        }
+                                    }
+                                    else {
+                                        if runiform()>0.5{
+                                            local stop = 1 // random draw above 0.5: search downward
+                                            forvalues kk = 1/`m' {
+                                                qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                                local v`kk'1_0 = r(N)
+                                                qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                                local v`kk'1_1 = r(N)
+                                                if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                                    qui replace item`j'= `=`m'-`kk'' if item`j'==`m'
+                                                    local zzz=`j'+`nbitems'
+                                                    *qui replace item`zzz'=`=`m'-`kk'' if item``=`j'+`nbitems'''==`m'
+                                                    *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                    local stop = 0
+                                                }
+                                            }
+                                        }
+                                        else {
+                                            local stop = 1 // otherwise search upward; an empty next category sends m straight to nbm_j
+                                            forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                                qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                                local v`kk'1_0 = r(N)
+                                                qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                                local v`kk'1_1 = r(N)
+                                                if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0{
+                                                    qui replace item`j'=`=`m' + `kk'' if item`j'==`m'
+                                                    local zzz=`j'+`nbitems'
+                                                    *qui replace item`zzz'=`=`m' + `kk'' if item``=`j'+`nbitems'''==`m'
+                                                    *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                    local stop = 0
+                                                }
+                                                else {
+                                                    if `stop' != 0 {
+                                                        qui replace item`j'= `nbm_`j'' if item`j'==`m'
+                                                        local zzz=`j'+`nbitems'
+                                                        *qui replace item`zzz'= `nbm_`j'' if item``=`j'+`nbitems'''==`m'
+                                                        *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                        local stop = 0
+                                                    }
+                                                }
+                                            }
+                                        }
+                                    }
+                                }
+                            }
+                            qui levelsof item`j'
+                            local val = r(levels)
+                            local checker: word 1 of `val'
+                            local checker2: word 2 of `val'
+                            local checker3: word 3 of `val'
+                            local 
nummoda=r(r)
+                            local nbmoda_`j'=`nummoda'-1 // observed levels minus 1, so it counts non-zero categories like nbmoda does
+                            if (`nummoda'==2) {
+                                qui recode item`j' (`checker'=0) (`checker2'=1)
+                            }
+                            if (`nummoda'==3) {
+                                if (`checker'!=0) {
+                                    qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2)
+                                }
+                                else if (`checker2'!=1) {
+                                    qui recode item`j' (`checker2'=1) (`checker3'=2)
+                                }
+                                else if (`checker3'!=2) {
+                                    qui recode item`j' (`checker3'=2)
+                                }
+                            }
+                        }
+                        * NOTE(review): valuesof is not a built-in Stata command (presumably the SSC package) - confirm it is installed
+                        qui valuesof comz
+                        local val = r(values)
+                        local checker: word 1 of `val'
+                    }
+                    else {
+                        forvalues jj=1/`nbitems' {
+                            local nbmoda_`jj'=`nbmoda'
+                        }
+                    }
+
+                    * Run ROSALI on the items with tt as grouping variable; r(difitems) is copied into resmat
+                    * ROSALI
+                    qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt)
+                    qui mat resmat=r(difitems)
+                    local nbitems2 = 2*`nbitems'
+                    * nbdetect = position of the first missing entry among the first nbitems columns of resmat, minus 1
+                    * Count the detected items
+                    local nbdetect = `nbitems' // kept when no entry is missing, i.e. every item was detected
+                    local stop = 0
+                    forvalues jj=1/`nbitems' {
+                        if (`stop'==0) {
+                            mat testm=J(1,1,.)
+                            if (resmat[1,`jj']==testm[1,1]) {
+                                local stop = 1
+                                local nbdetect = `jj'-1
+                            }
+                        }
+                    }
+                    * The detected item numbers are read from resmat inside the constraint loop below
+                    * Store the detected items
+                    * NOTE(review): a non-zero resmat[1,nbitems+i] presumably flags uniform DIF for item i - confirm against rosali_original
+                    * Constraint definitions
+                    local csrt=0
+                    mat testm=J(1,1,0)
+                    forvalues u=1/`nbdetect' {
+                        local difitems`u'=resmat[1,`u']
+                        local i=`difitems`u''
+                        if (`nbmoda_`i''==3 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+                            local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+                            qui `constrnt`u''
+                            local v=`u'+100
+                            local constrnt`u'_2 = "constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))"
+                            qui `constrnt`u'_2'
+                        }
+                        if (`nbmoda_`i''==2 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+                            local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+                            qui `constrnt`u''
+                        }
+                    }
+                    * The gsem command line is built as a string in mod and executed once complete
+                    * Model definition
+                    local mod "gsem "
+                    local conformula = ""
+                    forvalues i=1/`nbitems' {
+                        local mod = "`mod'"+"(1.item`i'<-THETA@1)"
+                        if (`nbmoda_`i''==3) {
+                            local mod = "`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)"
+                        }
+                        else if (`nbmoda_`i''==2) {
+                            local mod = "`mod'"+"(2.item`i'<-THETA@2)"
+                        }
+                    }
+                    forvalues u=1/`nbdetect' {
+                        local v=`difitems`u'' // detected items get tt added to each of their equations
+                        local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)"
+                        if (`nbmoda_`v''==3) {
+                            local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)"
+                        }
+                        else if (`nbmoda_`v''==2) {
+                            local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)"
+                        }
+                        local w= 100+`u' // number of the second constraint defined above for this item
+                        if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==3) {
+                            local conformula = "`conformula'" + "`u' " + "`w' "
+                        }
+                        else if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==2) {
+                            local conformula = "`conformula'" + "`u' "
+                        }
+                    }
+                    if ("`conformula'" != "") {
+                        local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')"
+                    }
+                    else {
+                        local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent"
+                    }
+                    *fit the model
+                    qui `mod'
+                    mat V=r(table)
+                    mat W=V[1..2,1...]
+                    * Copy values from row 1 of W into row k of outmat (one row per replication)
+                    * collect the item parameters (the _cons coefficient of each z.item equation)
+                    forvalues j=1/`nbitems' {
+                        forvalues z=1/`nbmoda_`j'' {
+                            mat outmat[`k',colnumb(outmat,"item`j'_`z'")] = W[1,colnumb(W,"`z'.item`j':_cons")]
+                        }
+                    }
+                    * collect the DIF parameters (the tt coefficient of each z.item equation of the detected items)
+                    forvalues u=1/`nbdetect' {
+                        local j=`difitems`u''
+                        forvalues z=1/`nbmoda_`j'' {
+                            mat outmat[`k',colnumb(outmat,"dif_`u'_`z'")] = W[1,colnumb(W,"`z'.item`j':tt")]
+                            mat outmat[`k',colnumb(outmat,"dif_detect_`u'")] = `j'
+                        }
+                    }
+                    * Above: the dif columns are indexed by detection order u, and dif_detect_u holds the matching item number
+                    * Store the original DIF items (first level of dif1, dif2 and dif3)
+                    if (`nbdif' > 0) {
+                        qui levelsof dif1
+                        local ldif1 = r(levels)
+                        local diff1: word 1 of `ldif1'
+                        qui mat outmat[`k',colnumb(outmat,"real_dif_1")]=`diff1'
+                        if (`nbdif' > 1) {
+                            qui levelsof dif2
+                            local ldif2 = r(levels)
+                            local diff2: word 1 of `ldif2'
+                            qui mat outmat[`k',colnumb(outmat,"real_dif_2")]=`diff2'
+                            if (`nbdif' > 2) {
+                                qui levelsof dif3
+                                local ldif3 = r(levels)
+                                local diff3: word 1 of `ldif3'
+                                qui mat outmat[`k',colnumb(outmat,"real_dif_3")]=`diff3'
+                            }
+                        }
+                    }
+                    qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,colnumb(W,"THETA:tt")]
+                    qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,colnumb(W,"THETA:tt")]
+                    restore
+                }
+                putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace
+                putexcel A1=matrix(outmat), colnames
+}
+}
+}
diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S10.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S10.do
new file mode 100644
index 0000000..71ececc
--- /dev/null
+++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S10.do
@@ -0,0 +1,364 @@
+*=================================================================================================================================================
+* Date : 2024-01-23
+* Stata version : Stata 18 SE
+*
+* This program analyses simulated data accounting for DIF through a partial credit model
+*
+* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea)
+*
+*
+*================================================================================================================================================
+adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom"
+
+* Sample sizes (N) and scenario number (ss) analysed by this file
+local N = "50 100 200 300"
+    local ss = "10"
+    foreach s in `ss' {
+        foreach Nnn in `N' {
+            local Nn = `Nnn'
+            local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'"
+            if (`s'<=4) {
+                local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'"
+            }
+            local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'"
+            local scenarios = "A B C D E F G"
+            foreach scen in `scenarios' {
+                clear
+                import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear
+                rename TT tt
+                * nbitems: 4 items for scenarios 1-2 and 5-12, 7 items for scenarios 3-4 and 13 onwards
+                if (`s'<=2) {
+                    local nbitems=4
+                }
+                else if (`s'<=4) {
+                    local nbitems=7
+                }
+                else if (`s'<=12) {
+                    local nbitems=4
+                }
+                else {
+                    local nbitems=7
+                }
+                * nbmoda: 3 for even-numbered scenarios, 1 for odd-numbered scenarios
+if (mod(`s',2)==0) {
+    local nbmoda=3
+}
+else {
+    local nbmoda=1
+}
+                * nbdif: 0 for scenarios 1-4, 1 for scenarios 5-8, 2 for scenarios 9-16, 3 above 16
+                if (`s'<=4) {
+                    local nbdif=0
+                }
+                else if (`s'<=8) {
+                    local nbdif=1
+                }
+                else if (`s'<=16) {
+                    local nbdif=2
+                }
+                else {
+                    local nbdif=3
+                }
+                * taillemat = at most J*M cells for the item parameters and J*M cells for the DIF parameters + J cells for the detected DIF items + nbdif cells for the real DIF items (+ 2 for beta and se_beta)
+                local taillemat=2*`nbitems'*`nbmoda'+`nbitems'+`nbdif'+2
+                local colna=""
+                forvalues i=1/`nbitems' {
+                    forvalues z=1/`nbmoda' {
+                        local colna = "`colna'"+"item`i'_`z' "
+                        local colna = "`colna'"+"dif_`i'_`z' "
+                    }
+                }
+                forvalues i=1/`nbitems' {
+                    local colna = "`colna'"+"dif_detect_`i' "
+                }
+                * One real_dif column per DIF item counted by nbdif
+                forvalues i=1/`nbdif' {
+                    local colna = "`colna'"+"real_dif_`i' "
+                }
+local colna = "`colna'" + "beta " + "se_beta"
+
+                * Results matrix: 1000 rows and taillemat columns, all initialised to missing
+                mat outmat = J(1000,`taillemat',.)
+                mat colnames outmat= `colna'
+                di "Scenario `s'`scen' / N=`Nnn'"
+                forvalues k=1/1000 {
+                    if (mod(`k',100)==0) {
+                        di "`k'/1000"
+                    }
+                    preserve // the full dataset is restored at the end of each replication
+                    qui keep if replication==`k'
+                    * The category merging below only runs when nbmoda>1 and N=50
+                    * A category of an item with no observation in at least one tt group is recoded to another category of that item
+                    * MERGE response categories that are not represented
+                    * comz is set to 1 as soon as one such empty category is found
+                    if (`nbmoda'>1 & `Nn'==50) {
+                        local com_z = 0
+                        qui gen comz = 0
+                        forvalues j = 1 / `nbitems' {
+                            local recoda_`j' = 0
+                            qui tab item`j' if tt == 0, matrow(rect1_g0_`j') matcell(nbrt1_g0_`j')
+                            local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1]
+                            local minm`j'_t1_g0 = rect1_g0_`j'[1,1]
+                            * Same tabulation for the tt==1 group
+                            qui tab item`j' if tt == 1, matrow(rect1_g1_`j') matcell(nbrt1_g1_`j')
+                            local minm`j'_t1_g1 = rect1_g1_`j'[1,1]
+                            local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1]
+                            * Lowest and highest observed category over both groups; nbm_j is their difference
+                            local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1')
+                            local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1')
+                            local nbm_`j' = `=`maxm_`j''-`minm_`j'''
+                            * com_z becomes 1 once the lowest observed category of some item is not 0
+                            if `minm_`j'' != 0 & `com_z' == 0 {
+                                local com_z = 1
+                            }
+                            * Category 3 absent from at least one group: flag comz
+                            qui count if item`j' == 3 & tt == 0
+                            local mod3plac = r(N)
+                            qui count if item`j' == 3 & tt == 1
+                            local mod3tt = r(N)
+                            local nb_rn3 = min(`mod3plac',`mod3tt')
+                            if `nb_rn3'==0 {
+                                qui replace comz = 1
+                            }
+                            * Scan categories 0 to nbm_j-1 and recode those that are empty in at least one group
+                            forvalues m = 0/`=`nbm_`j''-1' {
+                                qui count if item`j' == `m' & tt == 0
+                                local nb_rn1_g0 = r(N)
+                                qui count if item`j' == `m' & tt == 1
+                                local nb_rn1_g1 = r(N)
+                                local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1')
+                                if `nb_rn' == 0 {
+                                    qui replace comz = 1
+                                    local recoda_`j' = 1
+                                    if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' {
+                                        local stop = 1 // search upward (m+1, m+2, ...) for the first category observed in either group
+                                        forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                            local v`kk'1_0 = r(N)
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                            local v`kk'1_1 = r(N)
+                                            if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                                qui replace item`j'= `=`m'+`kk'' if item`j'==`m'
+                                                local zzz=`j'+`nbitems'
+                                                *qui replace item`zzz'=`=`m'+`kk'' if item``=`j'+`nbitems'''==`m'
+                                                *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                local stop = 0
+                                            }
+                                        }
+                                    }
+                                    else if `m' == `=`nbm_`j''-1' | `m' >= `maxm`j'_t1_g1' {
+                                        local stop = 1 // search downward (m-1, m-2, ...) for the first category observed in either group
+                                        forvalues kk = 1/`=`m'' {
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                            local v`kk'1_0 = r(N)
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                            local v`kk'1_1 = r(N)
+                                            if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                                qui replace item`j'= `=`m' - `kk'' if item`j'==`m'
+                                                local zzz=`j'+`nbitems'
+                                                *qui replace item`zzz'= `=`m' - `kk'' if item`zzz'==`m'
+                                                *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                local stop = 0
+                                            }
+                                        }
+                                    }
+                                    else {
+                                        if runiform()>0.5{
+                                            local stop = 1 // random draw above 0.5: search downward
+                                            forvalues kk = 1/`m' {
+                                                qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                                local v`kk'1_0 = r(N)
+                                                qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                                local v`kk'1_1 = r(N)
+                                                if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                                    qui replace item`j'= `=`m'-`kk'' if item`j'==`m'
+                                                    local zzz=`j'+`nbitems'
+                                                    *qui replace item`zzz'=`=`m'-`kk'' if item``=`j'+`nbitems'''==`m'
+                                                    *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                    local stop = 0
+                                                }
+                                            }
+                                        }
+                                        else {
+                                            local stop = 1 // otherwise search upward; an empty next category sends m straight to nbm_j
+                                            forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                                qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                                local v`kk'1_0 = r(N)
+                                                qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                                local v`kk'1_1 = r(N)
+                                                if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0{
+                                                    qui replace item`j'=`=`m' + `kk'' if item`j'==`m'
+                                                    local zzz=`j'+`nbitems'
+                                                    *qui replace item`zzz'=`=`m' + `kk'' if item``=`j'+`nbitems'''==`m'
+                                                    *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                    local stop = 0
+                                                }
+                                                else {
+                                                    if `stop' != 0 {
+                                                        qui replace item`j'= `nbm_`j'' if item`j'==`m'
+                                                        local zzz=`j'+`nbitems'
+                                                        *qui replace item`zzz'= `nbm_`j'' if item``=`j'+`nbitems'''==`m'
+                                                        *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                        local stop = 0
+                                                    }
+                                                }
+                                            }
+                                        }
+                                    }
+                                }
+                            }
+                            qui levelsof item`j'
+                            local val = r(levels)
+                            local checker: word 1 of `val'
+                            local checker2: word 2 of `val'
+                            local checker3: word 3 of `val'
+                            local 
nummoda=r(r)
+                            local nbmoda_`j'=`nummoda'-1 // observed levels minus 1, so it counts non-zero categories like nbmoda does
+                            if (`nummoda'==2) {
+                                qui recode item`j' (`checker'=0) (`checker2'=1)
+                            }
+                            if (`nummoda'==3) {
+                                if (`checker'!=0) {
+                                    qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2)
+                                }
+                                else if (`checker2'!=1) {
+                                    qui recode item`j' (`checker2'=1) (`checker3'=2)
+                                }
+                                else if (`checker3'!=2) {
+                                    qui recode item`j' (`checker3'=2)
+                                }
+                            }
+                        }
+                        * NOTE(review): valuesof is not a built-in Stata command (presumably the SSC package) - confirm it is installed
+                        qui valuesof comz
+                        local val = r(values)
+                        local checker: word 1 of `val'
+                    }
+                    else {
+                        forvalues jj=1/`nbitems' {
+                            local nbmoda_`jj'=`nbmoda'
+                        }
+                    }
+
+                    * Run ROSALI on the items with tt as grouping variable; r(difitems) is copied into resmat
+                    * ROSALI
+                    qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt)
+                    qui mat resmat=r(difitems)
+                    local nbitems2 = 2*`nbitems'
+                    * nbdetect = position of the first missing entry among the first nbitems columns of resmat, minus 1
+                    * Count the detected items
+                    local nbdetect = `nbitems' // kept when no entry is missing, i.e. every item was detected
+                    local stop = 0
+                    forvalues jj=1/`nbitems' {
+                        if (`stop'==0) {
+                            mat testm=J(1,1,.)
+                            if (resmat[1,`jj']==testm[1,1]) {
+                                local stop = 1
+                                local nbdetect = `jj'-1
+                            }
+                        }
+                    }
+                    * The detected item numbers are read from resmat inside the constraint loop below
+                    * Store the detected items
+                    * NOTE(review): a non-zero resmat[1,nbitems+i] presumably flags uniform DIF for item i - confirm against rosali_original
+                    * Constraint definitions
+                    local csrt=0
+                    mat testm=J(1,1,0)
+                    forvalues u=1/`nbdetect' {
+                        local difitems`u'=resmat[1,`u']
+                        local i=`difitems`u''
+                        if (`nbmoda_`i''==3 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+                            local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+                            qui `constrnt`u''
+                            local v=`u'+100
+                            local constrnt`u'_2 = "constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))"
+                            qui `constrnt`u'_2'
+                        }
+                        if (`nbmoda_`i''==2 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+                            local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+                            qui `constrnt`u''
+                        }
+                    }
+                    * The gsem command line is built as a string in mod and executed once complete
+                    * Model definition
+                    local mod "gsem "
+                    local conformula = ""
+                    forvalues i=1/`nbitems' {
+                        local mod = "`mod'"+"(1.item`i'<-THETA@1)"
+                        if (`nbmoda_`i''==3) {
+                            local mod = "`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)"
+                        }
+                        else if (`nbmoda_`i''==2) {
+                            local mod = "`mod'"+"(2.item`i'<-THETA@2)"
+                        }
+                    }
+                    forvalues u=1/`nbdetect' {
+                        local v=`difitems`u'' // detected items get tt added to each of their equations
+                        local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)"
+                        if (`nbmoda_`v''==3) {
+                            local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)"
+                        }
+                        else if (`nbmoda_`v''==2) {
+                            local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)"
+                        }
+                        local w= 100+`u' // number of the second constraint defined above for this item
+                        if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==3) {
+                            local conformula = "`conformula'" + "`u' " + "`w' "
+                        }
+                        else if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==2) {
+                            local conformula = "`conformula'" + "`u' "
+                        }
+                    }
+                    if ("`conformula'" != "") {
+                        local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')"
+                    }
+                    else {
+                        local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent"
+                    }
+                    *fit the model
+                    qui `mod'
+                    mat V=r(table)
+                    mat W=V[1..2,1...]
+                    * Copy values from row 1 of W into row k of outmat (one row per replication)
+                    * collect the item parameters (the _cons coefficient of each z.item equation)
+                    forvalues j=1/`nbitems' {
+                        forvalues z=1/`nbmoda_`j'' {
+                            mat outmat[`k',colnumb(outmat,"item`j'_`z'")] = W[1,colnumb(W,"`z'.item`j':_cons")]
+                        }
+                    }
+                    * collect the DIF parameters (the tt coefficient of each z.item equation of the detected items)
+                    forvalues u=1/`nbdetect' {
+                        local j=`difitems`u''
+                        forvalues z=1/`nbmoda_`j'' {
+                            mat outmat[`k',colnumb(outmat,"dif_`u'_`z'")] = W[1,colnumb(W,"`z'.item`j':tt")]
+                            mat outmat[`k',colnumb(outmat,"dif_detect_`u'")] = `j'
+                        }
+                    }
+                    * Above: the dif columns are indexed by detection order u, and dif_detect_u holds the matching item number
+                    * Store the original DIF items (first level of dif1, dif2 and dif3)
+                    if (`nbdif' > 0) {
+                        qui levelsof dif1
+                        local ldif1 = r(levels)
+                        local diff1: word 1 of `ldif1'
+                        qui mat outmat[`k',colnumb(outmat,"real_dif_1")]=`diff1'
+                        if (`nbdif' > 1) {
+                            qui levelsof dif2
+                            local ldif2 = r(levels)
+                            local diff2: word 1 of `ldif2'
+                            qui mat outmat[`k',colnumb(outmat,"real_dif_2")]=`diff2'
+                            if (`nbdif' > 2) {
+                                qui levelsof dif3
+                                local ldif3 = r(levels)
+                                local diff3: word 1 of `ldif3'
+                                qui mat outmat[`k',colnumb(outmat,"real_dif_3")]=`diff3'
+                            }
+                        }
+                    }
+                    qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,colnumb(W,"THETA:tt")]
+                    qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,colnumb(W,"THETA:tt")]
+                    restore
+                }
+                putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace
+                putexcel A1=matrix(outmat), colnames
+}
+}
+}
diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S11.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S11.do
new file mode 100644
index 0000000..d20bc42
--- /dev/null
+++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S11.do
@@ -0,0 +1,364 @@
+*=================================================================================================================================================
+* Date : 2024-01-23
+* Stata version : Stata 18 SE
+*
+* This program analyses simulated data accounting for DIF through a partial credit model
+*
+* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea)
+*
+*
+*================================================================================================================================================
+adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom"
+
+* Sample sizes (N) and scenario number (ss) analysed by this file
+local N = "50 100 200 300"
+    local ss = "11"
+    foreach s in `ss' {
+        foreach Nnn in `N' {
+            local Nn = `Nnn'
+            local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'"
+            if (`s'<=4) {
+                local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'"
+            }
+            local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'"
+            local scenarios = "A B C D E F G"
+            foreach scen in `scenarios' {
+                clear
+                import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear
+                rename TT tt
+                * nbitems: 4 items for scenarios 1-2 and 5-12, 7 items for scenarios 3-4 and 13 onwards
+                if (`s'<=2) {
+                    local nbitems=4
+                }
+                else if (`s'<=4) {
+                    local nbitems=7
+                }
+                else if (`s'<=12) {
+                    local nbitems=4
+                }
+                else {
+                    local nbitems=7
+                }
+                * nbmoda: 3 for even-numbered scenarios, 1 for odd-numbered scenarios
+if (mod(`s',2)==0) {
+    local nbmoda=3
+}
+else {
+    local nbmoda=1
+}
+                * nbdif: 0 for scenarios 1-4, 1 for scenarios 5-8, 2 for scenarios 9-16, 3 above 16
+                if (`s'<=4) {
+                    local nbdif=0
+                }
+                else if (`s'<=8) {
+                    local nbdif=1
+                }
+                else if (`s'<=16) {
+                    local nbdif=2
+                }
+                else {
+                    local nbdif=3
+                }
+                * taillemat = at most J*M cells for the item parameters and J*M cells for the DIF parameters + J cells for the detected DIF items + nbdif cells for the real DIF items (+ 2 for beta and se_beta)
+                local taillemat=2*`nbitems'*`nbmoda'+`nbitems'+`nbdif'+2
+                local colna=""
+                forvalues i=1/`nbitems' {
+                    forvalues z=1/`nbmoda' {
+                        local colna = "`colna'"+"item`i'_`z' "
+                        local colna = "`colna'"+"dif_`i'_`z' "
+                    }
+                }
+                forvalues i=1/`nbitems' {
+                    local colna = "`colna'"+"dif_detect_`i' "
+                }
+                * One real_dif column per DIF item counted by nbdif
+                forvalues i=1/`nbdif' {
+                    local colna = "`colna'"+"real_dif_`i' "
+                }
+local colna = "`colna'" + "beta " + "se_beta"
+
+                * Results matrix: 1000 rows and taillemat columns, all initialised to missing
+                mat outmat = J(1000,`taillemat',.)
+                mat colnames outmat= `colna'
+                di "Scenario `s'`scen' / N=`Nnn'"
+                forvalues k=1/1000 {
+                    if (mod(`k',100)==0) {
+                        di "`k'/1000"
+                    }
+                    preserve // the full dataset is restored at the end of each replication
+                    qui keep if replication==`k'
+                    * The category merging below only runs when nbmoda>1 and N=50
+                    * A category of an item with no observation in at least one tt group is recoded to another category of that item
+                    * MERGE response categories that are not represented
+                    * comz is set to 1 as soon as one such empty category is found
+                    if (`nbmoda'>1 & `Nn'==50) {
+                        local com_z = 0
+                        qui gen comz = 0
+                        forvalues j = 1 / `nbitems' {
+                            local recoda_`j' = 0
+                            qui tab item`j' if tt == 0, matrow(rect1_g0_`j') matcell(nbrt1_g0_`j')
+                            local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1]
+                            local minm`j'_t1_g0 = rect1_g0_`j'[1,1]
+                            * Same tabulation for the tt==1 group
+                            qui tab item`j' if tt == 1, matrow(rect1_g1_`j') matcell(nbrt1_g1_`j')
+                            local minm`j'_t1_g1 = rect1_g1_`j'[1,1]
+                            local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1]
+                            * Lowest and highest observed category over both groups; nbm_j is their difference
+                            local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1')
+                            local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1')
+                            local nbm_`j' = `=`maxm_`j''-`minm_`j'''
+                            * com_z becomes 1 once the lowest observed category of some item is not 0
+                            if `minm_`j'' != 0 & `com_z' == 0 {
+                                local com_z = 1
+                            }
+                            * Category 3 absent from at least one group: flag comz
+                            qui count if item`j' == 3 & tt == 0
+                            local mod3plac = r(N)
+                            qui count if item`j' == 3 & tt == 1
+                            local mod3tt = r(N)
+                            local nb_rn3 = min(`mod3plac',`mod3tt')
+                            if `nb_rn3'==0 {
+                                qui replace comz = 1
+                            }
+                            * Scan categories 0 to nbm_j-1 and recode those that are empty in at least one group
+                            forvalues m = 0/`=`nbm_`j''-1' {
+                                qui count if item`j' == `m' & tt == 0
+                                local nb_rn1_g0 = r(N)
+                                qui count if item`j' == `m' & tt == 1
+                                local nb_rn1_g1 = r(N)
+                                local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1')
+                                if `nb_rn' == 0 {
+                                    qui replace comz = 1
+                                    local recoda_`j' = 1
+                                    if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' {
+                                        local stop = 1 // search upward (m+1, m+2, ...) for the first category observed in either group
+                                        forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                            local v`kk'1_0 = r(N)
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                            local v`kk'1_1 = r(N)
+                                            if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                                qui replace item`j'= `=`m'+`kk'' if item`j'==`m'
+                                                local zzz=`j'+`nbitems'
+                                                *qui replace item`zzz'=`=`m'+`kk'' if item``=`j'+`nbitems'''==`m'
+                                                *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                local stop = 0
+                                            }
+                                        }
+                                    }
+                                    else if `m' == `=`nbm_`j''-1' | `m' >= `maxm`j'_t1_g1' {
+                                        local stop = 1 // search downward (m-1, m-2, ...) for the first category observed in either group
+                                        forvalues kk = 1/`=`m'' {
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                            local v`kk'1_0 = r(N)
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                            local v`kk'1_1 = r(N)
+                                            if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                                qui replace item`j'= `=`m' - `kk'' if item`j'==`m'
+                                                local zzz=`j'+`nbitems'
+                                                *qui replace item`zzz'= `=`m' - `kk'' if item`zzz'==`m'
+                                                *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                local stop = 0
+                                            }
+                                        }
+                                    }
+                                    else {
+                                        if runiform()>0.5{
+                                            local stop = 1 // random draw above 0.5: search downward
+                                            forvalues kk = 1/`m' {
+                                                qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                                local v`kk'1_0 = r(N)
+                                                qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                                local v`kk'1_1 = r(N)
+                                                if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                                    qui replace item`j'= `=`m'-`kk'' if item`j'==`m'
+                                                    local zzz=`j'+`nbitems'
+                                                    *qui replace item`zzz'=`=`m'-`kk'' if item``=`j'+`nbitems'''==`m'
+                                                    *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                    local stop = 0
+                                                }
+                                            }
+                                        }
+                                        else {
+                                            local stop = 1 // otherwise search upward; an empty next category sends m straight to nbm_j
+                                            forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                                qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                                local v`kk'1_0 = r(N)
+                                                qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                                local v`kk'1_1 = r(N)
+                                                if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0{
+                                                    qui replace item`j'=`=`m' + `kk'' if item`j'==`m'
+                                                    local zzz=`j'+`nbitems'
+                                                    *qui replace item`zzz'=`=`m' + `kk'' if item``=`j'+`nbitems'''==`m'
+                                                    *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                    local stop = 0
+                                                }
+                                                else {
+                                                    if `stop' != 0 {
+                                                        qui replace item`j'= `nbm_`j'' if item`j'==`m'
+                                                        local zzz=`j'+`nbitems'
+                                                        *qui replace item`zzz'= `nbm_`j'' if item``=`j'+`nbitems'''==`m'
+                                                        *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                        local stop = 0
+                                                    }
+                                                }
+                                            }
+                                        }
+                                    }
+                                }
+                            }
+                            qui levelsof item`j'
+                            local val = r(levels)
+                            local checker: word 1 of `val'
+                            local checker2: word 2 of `val'
+                            local checker3: word 3 of `val'
+                            local 
nummoda=r(r)
+                            local nbmoda_`j'=`nummoda'-1 // observed levels minus 1, so it counts non-zero categories like nbmoda does
+                            if (`nummoda'==2) {
+                                qui recode item`j' (`checker'=0) (`checker2'=1)
+                            }
+                            if (`nummoda'==3) {
+                                if (`checker'!=0) {
+                                    qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2)
+                                }
+                                else if (`checker2'!=1) {
+                                    qui recode item`j' (`checker2'=1) (`checker3'=2)
+                                }
+                                else if (`checker3'!=2) {
+                                    qui recode item`j' (`checker3'=2)
+                                }
+                            }
+                        }
+                        * NOTE(review): valuesof is not a built-in Stata command (presumably the SSC package) - confirm it is installed
+                        qui valuesof comz
+                        local val = r(values)
+                        local checker: word 1 of `val'
+                    }
+                    else {
+                        forvalues jj=1/`nbitems' {
+                            local nbmoda_`jj'=`nbmoda'
+                        }
+                    }
+
+                    * Run ROSALI on the items with tt as grouping variable; r(difitems) is copied into resmat
+                    * ROSALI
+                    qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt)
+                    qui mat resmat=r(difitems)
+                    local nbitems2 = 2*`nbitems'
+                    * nbdetect = position of the first missing entry among the first nbitems columns of resmat, minus 1
+                    * Count the detected items
+                    local nbdetect = `nbitems' // kept when no entry is missing, i.e. every item was detected
+                    local stop = 0
+                    forvalues jj=1/`nbitems' {
+                        if (`stop'==0) {
+                            mat testm=J(1,1,.)
+                            if (resmat[1,`jj']==testm[1,1]) {
+                                local stop = 1
+                                local nbdetect = `jj'-1
+                            }
+                        }
+                    }
+                    * The detected item numbers are read from resmat inside the constraint loop below
+                    * Store the detected items
+                    * NOTE(review): a non-zero resmat[1,nbitems+i] presumably flags uniform DIF for item i - confirm against rosali_original
+                    * Constraint definitions
+                    local csrt=0
+                    mat testm=J(1,1,0)
+                    forvalues u=1/`nbdetect' {
+                        local difitems`u'=resmat[1,`u']
+                        local i=`difitems`u''
+                        if (`nbmoda_`i''==3 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+                            local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+                            qui `constrnt`u''
+                            local v=`u'+100
+                            local constrnt`u'_2 = "constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))"
+                            qui `constrnt`u'_2'
+                        }
+                        if (`nbmoda_`i''==2 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+                            local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+                            qui `constrnt`u''
+                        }
+                    }
+                    * The gsem command line is built as a string in mod and executed once complete
+                    * Model definition
+                    local mod "gsem "
+                    local conformula = ""
+                    forvalues i=1/`nbitems' {
+                        local mod = "`mod'"+"(1.item`i'<-THETA@1)"
+                        if (`nbmoda_`i''==3) {
+                            local mod = "`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)"
+                        }
+                        else if (`nbmoda_`i''==2) {
+                            local mod = "`mod'"+"(2.item`i'<-THETA@2)"
+                        }
+                    }
+                    forvalues u=1/`nbdetect' {
+                        local v=`difitems`u'' // detected items get tt added to each of their equations
+                        local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)"
+                        if (`nbmoda_`v''==3) {
+                            local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)"
+                        }
+                        else if (`nbmoda_`v''==2) {
+                            local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)"
+                        }
+                        local w= 100+`u' // number of the second constraint defined above for this item
+                        if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==3) {
+                            local conformula = "`conformula'" + "`u' " + "`w' "
+                        }
+                        else if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==2) {
+                            local conformula = "`conformula'" + "`u' "
+                        }
+                    }
+                    if ("`conformula'" != "") {
+                        local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')"
+                    }
+                    else {
+                        local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent"
+                    }
+                    *fit the model
+                    qui `mod'
+                    mat V=r(table)
+                    mat W=V[1..2,1...]
+ + * compilation + forvalues j=1/`nbitems' { + forvalues z=1/`nbmoda_`j'' { + mat outmat[`k',colnumb(outmat,"item`j'_`z'")] = W[1,colnumb(W,"`z'.item`j':_cons")] + } + } + * compilation DIF + forvalues u=1/`nbdetect' { + local j=`difitems`u'' + forvalues z=1/`nbmoda_`j'' { + mat outmat[`k',colnumb(outmat,"dif_`u'_`z'")] = W[1,colnumb(W,"`z'.item`j':tt")] + mat outmat[`k',colnumb(outmat,"dif_detect_`u'")] = `j' + } + } + + * Stocker les items de DIF originaux + if (`nbdif' > 0) { + qui levelsof dif1 + local ldif1 = r(levels) + local diff1: word 1 of `ldif1' + qui mat outmat[`k',colnumb(outmat,"real_dif_1")]=`diff1' + if (`nbdif' > 1) { + qui levelsof dif2 + local ldif2 = r(levels) + local diff2: word 1 of `ldif2' + qui mat outmat[`k',colnumb(outmat,"real_dif_2")]=`diff2' + if (`nbdif' > 2) { + qui levelsof dif3 + local ldif3 = r(levels) + local diff3: word 1 of `ldif3' + qui mat outmat[`k',colnumb(outmat,"real_dif_3")]=`diff3' + } + } + } + qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,colnumb(W,"THETA:tt")] + qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,colnumb(W,"THETA:tt")] + restore + } + putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace + putexcel A1=matrix(outmat), colnames +} +} +} diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S12.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S12.do new file mode 100644 index 0000000..c6a392d --- /dev/null +++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S12.do @@ -0,0 +1,364 @@ +*================================================================================================================================================= +* Date : 2024-01-23 +* Stata version : Stata 18 SE +* +* This program analyses simulated data accounting for DIF through a partial credit model +* +* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea) +* +* 
+*================================================================================================================================================ +adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom" + + +local N = "50 100 200 300" + local ss = "12" + foreach s in `ss' { + foreach Nnn in `N' { + local Nn = `Nnn' + local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'" + if (`s'<=4) { + local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'" + } + local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'" + local scenarios = "A B C D E F G" + foreach scen in `scenarios' { + clear + import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear + rename TT tt + + if (`s'<=2) { + local nbitems=4 + } + else if (`s'<=4) { + local nbitems=7 + } + else if (`s'<=12) { + local nbitems=4 + } + else { + local nbitems=7 + } + +if (mod(`s',2)==0) { + local nbmoda=3 +} +else { + local nbmoda=1 +} + + if (`s'<=4) { + local nbdif=0 + } + else if (`s'<=8) { + local nbdif=1 + } + else if (`s'<=16) { + local nbdif=2 + } + else { + local nbdif=3 + } + * taillemat = Maximum J*M cases pour les items par et J*M cases pour les dif par + J cases pour les DIF detect + nbdif cases pour dif réel + local taillemat=2*`nbitems'*`nbmoda'+`nbitems'+`nbdif'+2 + local colna="" + forvalues i=1/`nbitems' { + forvalues z=1/`nbmoda' { + local colna = "`colna'"+"item`i'_`z' " + local colna = "`colna'"+"dif_`i'_`z' " + } + } + forvalues i=1/`nbitems' { + local colna = "`colna'"+"dif_detect_`i' " + } + + forvalues i=1/`nbdif' { + local colna = "`colna'"+"real_dif_`i' " + } +local colna = "`colna'" + "beta " + "se_beta" + + + mat outmat = J(1000,`taillemat',.) 
+ mat colnames outmat= `colna' + di "Scenario `s'`scen' / N=`Nnn'" + forvalues k=1/1000 { + if (mod(`k',100)==0) { + di "`k'/1000" + } + preserve + qui keep if replication==`k' + + + * MERGE des modalités si non représentées + + if (`nbmoda'>1 & `Nn'==50) { + local com_z = 0 + qui gen comz = 0 + forvalues j = 1 / `nbitems' { + local recoda_`j' = 0 + qui tab item`j' if tt == 0, matrow(rect1_g0_`j') matcell(nbrt1_g0_`j') + local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1] + local minm`j'_t1_g0 = rect1_g0_`j'[1,1] + + qui tab item`j' if tt == 1, matrow(rect1_g1_`j') matcell(nbrt1_g1_`j') + local minm`j'_t1_g1 = rect1_g1_`j'[1,1] + local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1] + + local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1') + local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1') + local nbm_`j' = `=`maxm_`j''-`minm_`j''' + + if `minm_`j'' != 0 & `com_z' == 0 { + local com_z = 1 + } + + qui count if item`j' == 3 & tt == 0 + local mod3plac = r(N) + qui count if item`j' == 3 & tt == 1 + local mod3tt = r(N) + local nb_rn3 = min(`mod3plac',`mod3tt') + if `nb_rn3'==0 { + qui replace comz = 1 + } + + forvalues m = 0/`=`nbm_`j''-1' { + qui count if item`j' == `m' & tt == 0 + local nb_rn1_g0 = r(N) + qui count if item`j' == `m' & tt == 1 + local nb_rn1_g1 = r(N) + local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1') + if `nb_rn' == 0 { + qui replace comz = 1 + local recoda_`j' = 1 + if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' { + local stop = 1 + forvalues kk = 1/`=`nbm_`j''-`m'' { + qui count if item`j' == `=`m' + `kk'' & tt == 0 + local v`kk'1_0 = r(N) + qui count if item`j' == `=`m' + `kk'' & tt == 1 + local v`kk'1_1 = r(N) + if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 { + qui replace item`j'= `=`m'+`kk'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'=`=`m'+`kk'' if item``=`j'+`nbitems'''==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + } + } + else if `m' == `=`nbm_`j''-1' | `m' >= 
`maxm`j'_t1_g1' { + local stop = 1 + forvalues kk = 1/`=`m'' { + qui count if item`j' == `=`m' - `kk'' & tt == 0 + local v`kk'1_0 = r(N) + qui count if item`j' == `=`m' - `kk'' & tt == 1 + local v`kk'1_1 = r(N) + if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 { + qui replace item`j'= `=`m' - `kk'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'= `=`m' - `kk'' if item`zzz'==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + } + } + else { + if runiform()>0.5{ + local stop = 1 + forvalues kk = 1/`m' { + qui count if item`j' == `=`m' - `kk'' & tt == 0 + local v`kk'1_0 = r(N) + qui count if item`j' == `=`m' - `kk'' & tt == 1 + local v`kk'1_1 = r(N) + if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 { + qui replace item`j'= `=`m'-`kk'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'=`=`m'-`kk'' if item``=`j'+`nbitems'''==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + } + } + else { + local stop = 1 + forvalues kk = 1/`=`nbm_`j''-`m'' { + qui count if item`j' == `=`m' + `kk'' & tt == 0 + local v`kk'1_0 = r(N) + qui count if item`j' == `=`m' + `kk'' & tt == 1 + local v`kk'1_1 = r(N) + if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0{ + qui replace item`j'=`=`m' + `kk'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'=`=`m' + `kk'' if item``=`j'+`nbitems'''==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + else { + if `stop' != 0 { + qui replace item`j'= `nbm_`j'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'= `nbm_`j'' if item``=`j'+`nbitems'''==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + } + } + } + } + } + } + qui levelsof item`j' + local val = r(levels) + local checker: word 1 of `val' + local checker2: word 2 of `val' + local checker3: word 3 of `val' + local 
nummoda=r(r) // r(r) left by the levelsof call just above: number of distinct categories still observed for item`j'
+                local nbmoda_`j'=`nummoda'-1 // highest category code once renumbered 0..nummoda-1 (levels minus one, same convention as `nbmoda' in the else branch below); storing the raw level count made the gsem outcomes and the outmat columns overshoot by one
+                if (`nummoda'==2) { // two categories left: renumber them 0/1
+                    qui recode item`j' (`checker'=0) (`checker2'=1)
+                }
+                if (`nummoda'==3) { // three categories left: renumber them 0/1/2, touching only the codes that are out of place
+                    if (`checker'!=0) {
+                        qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2)
+                    }
+                    else if (`checker2'!=1) {
+                        qui recode item`j' (`checker2'=1) (`checker3'=2)
+                    }
+                    else if (`checker3'!=2) {
+                        qui recode item`j' (`checker3'=2)
+                    }
+                }
+            }
+
+            qui valuesof comz // NOTE(review): valuesof is not an official Stata command and `val'/`checker' are not read again in this block - confirm whether these three lines are still needed
+            local val = r(values)
+            local checker: word 1 of `val'
+        }
+        else { // no merging step: every item keeps the scenario-wide `nbmoda'
+            forvalues jj=1/`nbitems' {
+                local nbmoda_`jj'=`nbmoda'
+            }
+        }
+
+
+        * ROSALI
+        qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt)
+        qui mat resmat=r(difitems) // row vector: entries 1..nbitems are read below as flagged item numbers, entries nbitems+i as a per-item flag
+        local nbitems2 = 2*`nbitems'
+
+        * Count the detected items: position of the first missing entry of resmat, minus one
+        local nbdetect = 0 // NOTE(review): stays 0 if none of the first `nbitems' entries is missing - confirm rosali can never flag every item
+        local stop = 0
+        forvalues jj=1/`nbitems' {
+            if (`stop'==0) {
+                mat testm=J(1,1,.)
+                if (resmat[1,`jj']==testm[1,1]) {
+                    local stop = 1
+                    local nbdetect = `jj'-1
+                }
+            }
+        }
+
+        * Store the detected items
+
+        * Constraint definitions: for flagged items whose resmat[1,nbitems+i] entry is non-zero, force the tt coefficient of outcome z to equal z times the tt coefficient of outcome 1 (presumably the uniform-DIF case - confirm against rosali's output)
+        local csrt=0
+        mat testm=J(1,1,0)
+        forvalues u=1/`nbdetect' {
+            local difitems`u'=resmat[1,`u']
+            local i=`difitems`u''
+            if (`nbmoda_`i''==3 & resmat[1,`nbitems'+`i']!=testm[1,1]){ // outcomes 1..3: constraints `u' (outcome 2) and 100+`u' (outcome 3)
+                local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+                qui `constrnt`u''
+                local v=`u'+100
+                local constrnt`u'_2 = "constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))"
+                qui `constrnt`u'_2'
+            }
+            if (`nbmoda_`i''==2 & resmat[1,`nbitems'+`i']!=testm[1,1]){ // outcomes 1..2: only constraint `u' is needed
+                local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+                qui `constrnt`u''
+            }
+        }
+
+        * Model definition: the gsem command line is accumulated in local `mod', one equation per non-base outcome of each item
+        local mod "gsem "
+        local conformula = ""
+        forvalues i=1/`nbitems' {
+            local mod = "`mod'"+"(1.item`i'<-THETA@1)"
+            if (`nbmoda_`i''==3) {
+                local mod = 
"`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)" + } + else if (`nbmoda_`i''==2) { + local mod = "`mod'"+"(2.item`i'<-THETA@2)" + } + } + forvalues u=1/`nbdetect' { + local v=`difitems`u'' + local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)" + if (`nbmoda_`v''==3) { + local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)" + } + else if (`nbmoda_`v''==2) { + local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)" + } + local w= 100+`u' + if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==3) { + local conformula = "`conformula'" + "`u' " + "`w' " + } + else if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==2) { + local conformula = "`conformula'" + "`u' " + } + } + if ("`conformula'" != "") { + local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')" + } + else { + local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent" + } + *calcul du modèle + qui `mod' + mat V=r(table) + mat W=V[1..2,1...] 
+ + * compilation + forvalues j=1/`nbitems' { + forvalues z=1/`nbmoda_`j'' { + mat outmat[`k',colnumb(outmat,"item`j'_`z'")] = W[1,colnumb(W,"`z'.item`j':_cons")] + } + } + * compilation DIF + forvalues u=1/`nbdetect' { + local j=`difitems`u'' + forvalues z=1/`nbmoda_`j'' { + mat outmat[`k',colnumb(outmat,"dif_`u'_`z'")] = W[1,colnumb(W,"`z'.item`j':tt")] + mat outmat[`k',colnumb(outmat,"dif_detect_`u'")] = `j' + } + } + + * Stocker les items de DIF originaux + if (`nbdif' > 0) { + qui levelsof dif1 + local ldif1 = r(levels) + local diff1: word 1 of `ldif1' + qui mat outmat[`k',colnumb(outmat,"real_dif_1")]=`diff1' + if (`nbdif' > 1) { + qui levelsof dif2 + local ldif2 = r(levels) + local diff2: word 1 of `ldif2' + qui mat outmat[`k',colnumb(outmat,"real_dif_2")]=`diff2' + if (`nbdif' > 2) { + qui levelsof dif3 + local ldif3 = r(levels) + local diff3: word 1 of `ldif3' + qui mat outmat[`k',colnumb(outmat,"real_dif_3")]=`diff3' + } + } + } + qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,colnumb(W,"THETA:tt")] + qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,colnumb(W,"THETA:tt")] + restore + } + putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace + putexcel A1=matrix(outmat), colnames +} +} +} diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S13.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S13.do new file mode 100644 index 0000000..ff9a7e8 --- /dev/null +++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S13.do @@ -0,0 +1,364 @@ +*================================================================================================================================================= +* Date : 2024-01-23 +* Stata version : Stata 18 SE +* +* This program analyses simulated data accounting for DIF through a partial credit model +* +* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea) +* +* 
+*================================================================================================================================================ +adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom" + + +local N = "50 100 200 300" + local ss = "13" + foreach s in `ss' { + foreach Nnn in `N' { + local Nn = `Nnn' + local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'" + if (`s'<=4) { + local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'" + } + local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'" + local scenarios = "A B C D E F G" + foreach scen in `scenarios' { + clear + import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear + rename TT tt + + if (`s'<=2) { + local nbitems=4 + } + else if (`s'<=4) { + local nbitems=7 + } + else if (`s'<=12) { + local nbitems=4 + } + else { + local nbitems=7 + } + +if (mod(`s',2)==0) { + local nbmoda=3 +} +else { + local nbmoda=1 +} + + if (`s'<=4) { + local nbdif=0 + } + else if (`s'<=8) { + local nbdif=1 + } + else if (`s'<=16) { + local nbdif=2 + } + else { + local nbdif=3 + } + * taillemat = Maximum J*M cases pour les items par et J*M cases pour les dif par + J cases pour les DIF detect + nbdif cases pour dif réel + local taillemat=2*`nbitems'*`nbmoda'+`nbitems'+`nbdif'+2 + local colna="" + forvalues i=1/`nbitems' { + forvalues z=1/`nbmoda' { + local colna = "`colna'"+"item`i'_`z' " + local colna = "`colna'"+"dif_`i'_`z' " + } + } + forvalues i=1/`nbitems' { + local colna = "`colna'"+"dif_detect_`i' " + } + + forvalues i=1/`nbdif' { + local colna = "`colna'"+"real_dif_`i' " + } +local colna = "`colna'" + "beta " + "se_beta" + + + mat outmat = J(1000,`taillemat',.) 
+ mat colnames outmat= `colna' + di "Scenario `s'`scen' / N=`Nnn'" + forvalues k=1/1000 { + if (mod(`k',100)==0) { + di "`k'/1000" + } + preserve + qui keep if replication==`k' + + + * MERGE des modalités si non représentées + + if (`nbmoda'>1 & `Nn'==50) { + local com_z = 0 + qui gen comz = 0 + forvalues j = 1 / `nbitems' { + local recoda_`j' = 0 + qui tab item`j' if tt == 0, matrow(rect1_g0_`j') matcell(nbrt1_g0_`j') + local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1] + local minm`j'_t1_g0 = rect1_g0_`j'[1,1] + + qui tab item`j' if tt == 1, matrow(rect1_g1_`j') matcell(nbrt1_g1_`j') + local minm`j'_t1_g1 = rect1_g1_`j'[1,1] + local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1] + + local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1') + local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1') + local nbm_`j' = `=`maxm_`j''-`minm_`j''' + + if `minm_`j'' != 0 & `com_z' == 0 { + local com_z = 1 + } + + qui count if item`j' == 3 & tt == 0 + local mod3plac = r(N) + qui count if item`j' == 3 & tt == 1 + local mod3tt = r(N) + local nb_rn3 = min(`mod3plac',`mod3tt') + if `nb_rn3'==0 { + qui replace comz = 1 + } + + forvalues m = 0/`=`nbm_`j''-1' { + qui count if item`j' == `m' & tt == 0 + local nb_rn1_g0 = r(N) + qui count if item`j' == `m' & tt == 1 + local nb_rn1_g1 = r(N) + local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1') + if `nb_rn' == 0 { + qui replace comz = 1 + local recoda_`j' = 1 + if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' { + local stop = 1 + forvalues kk = 1/`=`nbm_`j''-`m'' { + qui count if item`j' == `=`m' + `kk'' & tt == 0 + local v`kk'1_0 = r(N) + qui count if item`j' == `=`m' + `kk'' & tt == 1 + local v`kk'1_1 = r(N) + if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 { + qui replace item`j'= `=`m'+`kk'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'=`=`m'+`kk'' if item``=`j'+`nbitems'''==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + } + } + else if `m' == `=`nbm_`j''-1' | `m' >= 
`maxm`j'_t1_g1' { + local stop = 1 + forvalues kk = 1/`=`m'' { + qui count if item`j' == `=`m' - `kk'' & tt == 0 + local v`kk'1_0 = r(N) + qui count if item`j' == `=`m' - `kk'' & tt == 1 + local v`kk'1_1 = r(N) + if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 { + qui replace item`j'= `=`m' - `kk'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'= `=`m' - `kk'' if item`zzz'==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + } + } + else { + if runiform()>0.5{ + local stop = 1 + forvalues kk = 1/`m' { + qui count if item`j' == `=`m' - `kk'' & tt == 0 + local v`kk'1_0 = r(N) + qui count if item`j' == `=`m' - `kk'' & tt == 1 + local v`kk'1_1 = r(N) + if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 { + qui replace item`j'= `=`m'-`kk'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'=`=`m'-`kk'' if item``=`j'+`nbitems'''==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + } + } + else { + local stop = 1 + forvalues kk = 1/`=`nbm_`j''-`m'' { + qui count if item`j' == `=`m' + `kk'' & tt == 0 + local v`kk'1_0 = r(N) + qui count if item`j' == `=`m' + `kk'' & tt == 1 + local v`kk'1_1 = r(N) + if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0{ + qui replace item`j'=`=`m' + `kk'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'=`=`m' + `kk'' if item``=`j'+`nbitems'''==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + else { + if `stop' != 0 { + qui replace item`j'= `nbm_`j'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'= `nbm_`j'' if item``=`j'+`nbitems'''==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + } + } + } + } + } + } + qui levelsof item`j' + local val = r(levels) + local checker: word 1 of `val' + local checker2: word 2 of `val' + local checker3: word 3 of `val' + local 
nummoda=r(r) // r(r) left by the levelsof call just above: number of distinct categories still observed for item`j'
+                local nbmoda_`j'=`nummoda'-1 // highest category code once renumbered 0..nummoda-1 (levels minus one, same convention as `nbmoda' in the else branch below); storing the raw level count made the gsem outcomes and the outmat columns overshoot by one
+                if (`nummoda'==2) { // two categories left: renumber them 0/1
+                    qui recode item`j' (`checker'=0) (`checker2'=1)
+                }
+                if (`nummoda'==3) { // three categories left: renumber them 0/1/2, touching only the codes that are out of place
+                    if (`checker'!=0) {
+                        qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2)
+                    }
+                    else if (`checker2'!=1) {
+                        qui recode item`j' (`checker2'=1) (`checker3'=2)
+                    }
+                    else if (`checker3'!=2) {
+                        qui recode item`j' (`checker3'=2)
+                    }
+                }
+            }
+
+            qui valuesof comz // NOTE(review): valuesof is not an official Stata command and `val'/`checker' are not read again in this block - confirm whether these three lines are still needed
+            local val = r(values)
+            local checker: word 1 of `val'
+        }
+        else { // no merging step: every item keeps the scenario-wide `nbmoda'
+            forvalues jj=1/`nbitems' {
+                local nbmoda_`jj'=`nbmoda'
+            }
+        }
+
+
+        * ROSALI
+        qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt)
+        qui mat resmat=r(difitems) // row vector: entries 1..nbitems are read below as flagged item numbers, entries nbitems+i as a per-item flag
+        local nbitems2 = 2*`nbitems'
+
+        * Count the detected items: position of the first missing entry of resmat, minus one
+        local nbdetect = 0 // NOTE(review): stays 0 if none of the first `nbitems' entries is missing - confirm rosali can never flag every item
+        local stop = 0
+        forvalues jj=1/`nbitems' {
+            if (`stop'==0) {
+                mat testm=J(1,1,.)
+                if (resmat[1,`jj']==testm[1,1]) {
+                    local stop = 1
+                    local nbdetect = `jj'-1
+                }
+            }
+        }
+
+        * Store the detected items
+
+        * Constraint definitions: for flagged items whose resmat[1,nbitems+i] entry is non-zero, force the tt coefficient of outcome z to equal z times the tt coefficient of outcome 1 (presumably the uniform-DIF case - confirm against rosali's output)
+        local csrt=0
+        mat testm=J(1,1,0)
+        forvalues u=1/`nbdetect' {
+            local difitems`u'=resmat[1,`u']
+            local i=`difitems`u''
+            if (`nbmoda_`i''==3 & resmat[1,`nbitems'+`i']!=testm[1,1]){ // outcomes 1..3: constraints `u' (outcome 2) and 100+`u' (outcome 3)
+                local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+                qui `constrnt`u''
+                local v=`u'+100
+                local constrnt`u'_2 = "constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))"
+                qui `constrnt`u'_2'
+            }
+            if (`nbmoda_`i''==2 & resmat[1,`nbitems'+`i']!=testm[1,1]){ // outcomes 1..2: only constraint `u' is needed
+                local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+                qui `constrnt`u''
+            }
+        }
+
+        * Model definition: the gsem command line is accumulated in local `mod', one equation per non-base outcome of each item
+        local mod "gsem "
+        local conformula = ""
+        forvalues i=1/`nbitems' {
+            local mod = "`mod'"+"(1.item`i'<-THETA@1)"
+            if (`nbmoda_`i''==3) {
+                local mod = 
"`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)" + } + else if (`nbmoda_`i''==2) { + local mod = "`mod'"+"(2.item`i'<-THETA@2)" + } + } + forvalues u=1/`nbdetect' { + local v=`difitems`u'' + local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)" + if (`nbmoda_`v''==3) { + local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)" + } + else if (`nbmoda_`v''==2) { + local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)" + } + local w= 100+`u' + if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==3) { + local conformula = "`conformula'" + "`u' " + "`w' " + } + else if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==2) { + local conformula = "`conformula'" + "`u' " + } + } + if ("`conformula'" != "") { + local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')" + } + else { + local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent" + } + *calcul du modèle + qui `mod' + mat V=r(table) + mat W=V[1..2,1...] 
+ + * compilation + forvalues j=1/`nbitems' { + forvalues z=1/`nbmoda_`j'' { + mat outmat[`k',colnumb(outmat,"item`j'_`z'")] = W[1,colnumb(W,"`z'.item`j':_cons")] + } + } + * compilation DIF + forvalues u=1/`nbdetect' { + local j=`difitems`u'' + forvalues z=1/`nbmoda_`j'' { + mat outmat[`k',colnumb(outmat,"dif_`u'_`z'")] = W[1,colnumb(W,"`z'.item`j':tt")] + mat outmat[`k',colnumb(outmat,"dif_detect_`u'")] = `j' + } + } + + * Stocker les items de DIF originaux + if (`nbdif' > 0) { + qui levelsof dif1 + local ldif1 = r(levels) + local diff1: word 1 of `ldif1' + qui mat outmat[`k',colnumb(outmat,"real_dif_1")]=`diff1' + if (`nbdif' > 1) { + qui levelsof dif2 + local ldif2 = r(levels) + local diff2: word 1 of `ldif2' + qui mat outmat[`k',colnumb(outmat,"real_dif_2")]=`diff2' + if (`nbdif' > 2) { + qui levelsof dif3 + local ldif3 = r(levels) + local diff3: word 1 of `ldif3' + qui mat outmat[`k',colnumb(outmat,"real_dif_3")]=`diff3' + } + } + } + qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,colnumb(W,"THETA:tt")] + qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,colnumb(W,"THETA:tt")] + restore + } + putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace + putexcel A1=matrix(outmat), colnames +} +} +} diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S14.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S14.do new file mode 100644 index 0000000..1a584e4 --- /dev/null +++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S14.do @@ -0,0 +1,364 @@ +*================================================================================================================================================= +* Date : 2024-01-23 +* Stata version : Stata 18 SE +* +* This program analyses simulated data accounting for DIF through a partial credit model +* +* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea) +* +* 
+*================================================================================================================================================ +adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom" + + +local N = "50 100 200 300" + local ss = "14" + foreach s in `ss' { + foreach Nnn in `N' { + local Nn = `Nnn' + local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'" + if (`s'<=4) { + local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'" + } + local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'" + local scenarios = "A B C D E F G" + foreach scen in `scenarios' { + clear + import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear + rename TT tt + + if (`s'<=2) { + local nbitems=4 + } + else if (`s'<=4) { + local nbitems=7 + } + else if (`s'<=12) { + local nbitems=4 + } + else { + local nbitems=7 + } + +if (mod(`s',2)==0) { + local nbmoda=3 +} +else { + local nbmoda=1 +} + + if (`s'<=4) { + local nbdif=0 + } + else if (`s'<=8) { + local nbdif=1 + } + else if (`s'<=16) { + local nbdif=2 + } + else { + local nbdif=3 + } + * taillemat = Maximum J*M cases pour les items par et J*M cases pour les dif par + J cases pour les DIF detect + nbdif cases pour dif réel + local taillemat=2*`nbitems'*`nbmoda'+`nbitems'+`nbdif'+2 + local colna="" + forvalues i=1/`nbitems' { + forvalues z=1/`nbmoda' { + local colna = "`colna'"+"item`i'_`z' " + local colna = "`colna'"+"dif_`i'_`z' " + } + } + forvalues i=1/`nbitems' { + local colna = "`colna'"+"dif_detect_`i' " + } + + forvalues i=1/`nbdif' { + local colna = "`colna'"+"real_dif_`i' " + } +local colna = "`colna'" + "beta " + "se_beta" + + + mat outmat = J(1000,`taillemat',.) 
+ mat colnames outmat= `colna' + di "Scenario `s'`scen' / N=`Nnn'" + forvalues k=1/1000 { + if (mod(`k',100)==0) { + di "`k'/1000" + } + preserve + qui keep if replication==`k' + + + * MERGE des modalités si non représentées + + if (`nbmoda'>1 & `Nn'==50) { + local com_z = 0 + qui gen comz = 0 + forvalues j = 1 / `nbitems' { + local recoda_`j' = 0 + qui tab item`j' if tt == 0, matrow(rect1_g0_`j') matcell(nbrt1_g0_`j') + local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1] + local minm`j'_t1_g0 = rect1_g0_`j'[1,1] + + qui tab item`j' if tt == 1, matrow(rect1_g1_`j') matcell(nbrt1_g1_`j') + local minm`j'_t1_g1 = rect1_g1_`j'[1,1] + local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1] + + local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1') + local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1') + local nbm_`j' = `=`maxm_`j''-`minm_`j''' + + if `minm_`j'' != 0 & `com_z' == 0 { + local com_z = 1 + } + + qui count if item`j' == 3 & tt == 0 + local mod3plac = r(N) + qui count if item`j' == 3 & tt == 1 + local mod3tt = r(N) + local nb_rn3 = min(`mod3plac',`mod3tt') + if `nb_rn3'==0 { + qui replace comz = 1 + } + + forvalues m = 0/`=`nbm_`j''-1' { + qui count if item`j' == `m' & tt == 0 + local nb_rn1_g0 = r(N) + qui count if item`j' == `m' & tt == 1 + local nb_rn1_g1 = r(N) + local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1') + if `nb_rn' == 0 { + qui replace comz = 1 + local recoda_`j' = 1 + if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' { + local stop = 1 + forvalues kk = 1/`=`nbm_`j''-`m'' { + qui count if item`j' == `=`m' + `kk'' & tt == 0 + local v`kk'1_0 = r(N) + qui count if item`j' == `=`m' + `kk'' & tt == 1 + local v`kk'1_1 = r(N) + if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 { + qui replace item`j'= `=`m'+`kk'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'=`=`m'+`kk'' if item``=`j'+`nbitems'''==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + } + } + else if `m' == `=`nbm_`j''-1' | `m' >= 
`maxm`j'_t1_g1' { + local stop = 1 + forvalues kk = 1/`=`m'' { + qui count if item`j' == `=`m' - `kk'' & tt == 0 + local v`kk'1_0 = r(N) + qui count if item`j' == `=`m' - `kk'' & tt == 1 + local v`kk'1_1 = r(N) + if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 { + qui replace item`j'= `=`m' - `kk'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'= `=`m' - `kk'' if item`zzz'==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + } + } + else { + if runiform()>0.5{ + local stop = 1 + forvalues kk = 1/`m' { + qui count if item`j' == `=`m' - `kk'' & tt == 0 + local v`kk'1_0 = r(N) + qui count if item`j' == `=`m' - `kk'' & tt == 1 + local v`kk'1_1 = r(N) + if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 { + qui replace item`j'= `=`m'-`kk'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'=`=`m'-`kk'' if item``=`j'+`nbitems'''==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + } + } + else { + local stop = 1 + forvalues kk = 1/`=`nbm_`j''-`m'' { + qui count if item`j' == `=`m' + `kk'' & tt == 0 + local v`kk'1_0 = r(N) + qui count if item`j' == `=`m' + `kk'' & tt == 1 + local v`kk'1_1 = r(N) + if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0{ + qui replace item`j'=`=`m' + `kk'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'=`=`m' + `kk'' if item``=`j'+`nbitems'''==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + else { + if `stop' != 0 { + qui replace item`j'= `nbm_`j'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'= `nbm_`j'' if item``=`j'+`nbitems'''==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + } + } + } + } + } + } + qui levelsof item`j' + local val = r(levels) + local checker: word 1 of `val' + local checker2: word 2 of `val' + local checker3: word 3 of `val' + local 
nummoda=r(r) // r(r) left by the levelsof call just above: number of distinct categories still observed for item`j'
+                local nbmoda_`j'=`nummoda'-1 // highest category code once renumbered 0..nummoda-1 (levels minus one, same convention as `nbmoda' in the else branch below); storing the raw level count made the gsem outcomes and the outmat columns overshoot by one
+                if (`nummoda'==2) { // two categories left: renumber them 0/1
+                    qui recode item`j' (`checker'=0) (`checker2'=1)
+                }
+                if (`nummoda'==3) { // three categories left: renumber them 0/1/2, touching only the codes that are out of place
+                    if (`checker'!=0) {
+                        qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2)
+                    }
+                    else if (`checker2'!=1) {
+                        qui recode item`j' (`checker2'=1) (`checker3'=2)
+                    }
+                    else if (`checker3'!=2) {
+                        qui recode item`j' (`checker3'=2)
+                    }
+                }
+            }
+
+            qui valuesof comz // NOTE(review): valuesof is not an official Stata command and `val'/`checker' are not read again in this block - confirm whether these three lines are still needed
+            local val = r(values)
+            local checker: word 1 of `val'
+        }
+        else { // no merging step: every item keeps the scenario-wide `nbmoda'
+            forvalues jj=1/`nbitems' {
+                local nbmoda_`jj'=`nbmoda'
+            }
+        }
+
+
+        * ROSALI
+        qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt)
+        qui mat resmat=r(difitems) // row vector: entries 1..nbitems are read below as flagged item numbers, entries nbitems+i as a per-item flag
+        local nbitems2 = 2*`nbitems'
+
+        * Count the detected items: position of the first missing entry of resmat, minus one
+        local nbdetect = 0 // NOTE(review): stays 0 if none of the first `nbitems' entries is missing - confirm rosali can never flag every item
+        local stop = 0
+        forvalues jj=1/`nbitems' {
+            if (`stop'==0) {
+                mat testm=J(1,1,.)
+                if (resmat[1,`jj']==testm[1,1]) {
+                    local stop = 1
+                    local nbdetect = `jj'-1
+                }
+            }
+        }
+
+        * Store the detected items
+
+        * Constraint definitions: for flagged items whose resmat[1,nbitems+i] entry is non-zero, force the tt coefficient of outcome z to equal z times the tt coefficient of outcome 1 (presumably the uniform-DIF case - confirm against rosali's output)
+        local csrt=0
+        mat testm=J(1,1,0)
+        forvalues u=1/`nbdetect' {
+            local difitems`u'=resmat[1,`u']
+            local i=`difitems`u''
+            if (`nbmoda_`i''==3 & resmat[1,`nbitems'+`i']!=testm[1,1]){ // outcomes 1..3: constraints `u' (outcome 2) and 100+`u' (outcome 3)
+                local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+                qui `constrnt`u''
+                local v=`u'+100
+                local constrnt`u'_2 = "constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))"
+                qui `constrnt`u'_2'
+            }
+            if (`nbmoda_`i''==2 & resmat[1,`nbitems'+`i']!=testm[1,1]){ // outcomes 1..2: only constraint `u' is needed
+                local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+                qui `constrnt`u''
+            }
+        }
+
+        * Model definition: the gsem command line is accumulated in local `mod', one equation per non-base outcome of each item
+        local mod "gsem "
+        local conformula = ""
+        forvalues i=1/`nbitems' {
+            local mod = "`mod'"+"(1.item`i'<-THETA@1)"
+            if (`nbmoda_`i''==3) {
+                local mod = 
"`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)" + } + else if (`nbmoda_`i''==2) { + local mod = "`mod'"+"(2.item`i'<-THETA@2)" + } + } + forvalues u=1/`nbdetect' { + local v=`difitems`u'' + local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)" + if (`nbmoda_`v''==3) { + local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)" + } + else if (`nbmoda_`v''==2) { + local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)" + } + local w= 100+`u' + if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==3) { + local conformula = "`conformula'" + "`u' " + "`w' " + } + else if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==2) { + local conformula = "`conformula'" + "`u' " + } + } + if ("`conformula'" != "") { + local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')" + } + else { + local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent" + } + *calcul du modèle + qui `mod' + mat V=r(table) + mat W=V[1..2,1...] 
+ + * compilation + forvalues j=1/`nbitems' { + forvalues z=1/`nbmoda_`j'' { + mat outmat[`k',colnumb(outmat,"item`j'_`z'")] = W[1,colnumb(W,"`z'.item`j':_cons")] + } + } + * compilation DIF + forvalues u=1/`nbdetect' { + local j=`difitems`u'' + forvalues z=1/`nbmoda_`j'' { + mat outmat[`k',colnumb(outmat,"dif_`u'_`z'")] = W[1,colnumb(W,"`z'.item`j':tt")] + mat outmat[`k',colnumb(outmat,"dif_detect_`u'")] = `j' + } + } + + * Stocker les items de DIF originaux + if (`nbdif' > 0) { + qui levelsof dif1 + local ldif1 = r(levels) + local diff1: word 1 of `ldif1' + qui mat outmat[`k',colnumb(outmat,"real_dif_1")]=`diff1' + if (`nbdif' > 1) { + qui levelsof dif2 + local ldif2 = r(levels) + local diff2: word 1 of `ldif2' + qui mat outmat[`k',colnumb(outmat,"real_dif_2")]=`diff2' + if (`nbdif' > 2) { + qui levelsof dif3 + local ldif3 = r(levels) + local diff3: word 1 of `ldif3' + qui mat outmat[`k',colnumb(outmat,"real_dif_3")]=`diff3' + } + } + } + qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,colnumb(W,"THETA:tt")] + qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,colnumb(W,"THETA:tt")] + restore + } + putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace + putexcel A1=matrix(outmat), colnames +} +} +} diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S15.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S15.do new file mode 100644 index 0000000..9611f26 --- /dev/null +++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S15.do @@ -0,0 +1,364 @@ +*================================================================================================================================================= +* Date : 2024-01-23 +* Stata version : Stata 18 SE +* +* This program analyses simulated data accounting for DIF through a partial credit model +* +* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea) +* +* 
+*================================================================================================================================================
+adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom"
+
+* Driver: for each scenario number, sample size and sub-scenario letter, analyse replications 1 to 1000 and export one result row per replication
+local N = "50 100 200 300"
+local ss = "15"
+foreach s in `ss' {
+    foreach Nnn in `N' {
+        local Nn = `Nnn'
+        local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'"
+        if (`s'<=4) {
+            local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'"
+        }
+        local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'"
+        local scenarios = "A B C D E F G"
+        foreach scen in `scenarios' {
+            clear
+            import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear
+            rename TT tt
+            * Number of items, derived from the scenario number
+            if (`s'<=2) {
+                local nbitems=4
+            }
+            else if (`s'<=4) {
+                local nbitems=7
+            }
+            else if (`s'<=12) {
+                local nbitems=4
+            }
+            else {
+                local nbitems=7
+            }
+            * nbmoda is the highest category code, i.e. the number of non-zero response categories per item
+            if (mod(`s',2)==0) {
+                local nbmoda=3
+            }
+            else {
+                local nbmoda=1
+            }
+            * Number of DIF item columns (dif1, dif2, dif3) read from the data for this scenario
+            if (`s'<=4) {
+                local nbdif=0
+            }
+            else if (`s'<=8) {
+                local nbdif=1
+            }
+            else if (`s'<=16) {
+                local nbdif=2
+            }
+            else {
+                local nbdif=3
+            }
+            * taillemat = at most J*M cells for the item parameters and J*M cells for the DIF parameters + J cells for the detected DIF items + nbdif cells for the original DIF items + 2 cells for beta and se_beta
+            local taillemat=2*`nbitems'*`nbmoda'+`nbitems'+`nbdif'+2
+            local colna=""
+            forvalues i=1/`nbitems' {
+                forvalues z=1/`nbmoda' {
+                    local colna = "`colna'"+"item`i'_`z' "
+                    local colna = "`colna'"+"dif_`i'_`z' "
+                }
+            }
+            forvalues i=1/`nbitems' {
+                local colna = "`colna'"+"dif_detect_`i' "
+            }
+
+            forvalues i=1/`nbdif' {
+                local colna = "`colna'"+"real_dif_`i' "
+            }
+            local colna = "`colna'" + "beta " + "se_beta"
+
+            * One row of outmat per replication
+            mat outmat = J(1000,`taillemat',.)
+            mat colnames outmat= `colna'
+            di "Scenario `s'`scen' / N=`Nnn'"
+            forvalues k=1/1000 {
+                if (mod(`k',100)==0) {
+                    di "`k'/1000"
+                }
+                preserve
+                qui keep if replication==`k'
+
+
+                * Merge response categories that are empty in at least one group (only run when nbmoda>1 and N=50)
+
+                if (`nbmoda'>1 & `Nn'==50) {
+                    local com_z = 0
+                    qui gen comz = 0
+                    forvalues j = 1 / `nbitems' {
+                        local recoda_`j' = 0
+                        qui tab item`j' if tt == 0, matrow(rect1_g0_`j') matcell(nbrt1_g0_`j')
+                        local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1]
+                        local minm`j'_t1_g0 = rect1_g0_`j'[1,1]
+
+                        qui tab item`j' if tt == 1, matrow(rect1_g1_`j') matcell(nbrt1_g1_`j')
+                        local minm`j'_t1_g1 = rect1_g1_`j'[1,1]
+                        local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1]
+
+                        local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1')
+                        local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1')
+                        local nbm_`j' = `=`maxm_`j''-`minm_`j'''
+
+                        if `minm_`j'' != 0 & `com_z' == 0 {
+                            local com_z = 1
+                        }
+
+                        qui count if item`j' == 3 & tt == 0
+                        local mod3plac = r(N)
+                        qui count if item`j' == 3 & tt == 1
+                        local mod3tt = r(N)
+                        local nb_rn3 = min(`mod3plac',`mod3tt')
+                        if `nb_rn3'==0 {
+                            qui replace comz = 1
+                        }
+
+                        forvalues m = 0/`=`nbm_`j''-1' {
+                            qui count if item`j' == `m' & tt == 0
+                            local nb_rn1_g0 = r(N)
+                            qui count if item`j' == `m' & tt == 1
+                            local nb_rn1_g1 = r(N)
+                            local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1')
+                            if `nb_rn' == 0 {
+                                qui replace comz = 1
+                                local recoda_`j' = 1
+                                if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' { // merge upward into the first higher category that is observed
+                                    local stop = 1
+                                    forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                        qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                        local v`kk'1_0 = r(N)
+                                        qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                        local v`kk'1_1 = r(N)
+                                        if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                            qui replace item`j'= `=`m'+`kk'' if item`j'==`m'
+                                            local zzz=`j'+`nbitems'
+                                            *qui replace item`zzz'=`=`m'+`kk'' if item``=`j'+`nbitems'''==`m'
+                                            *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                            local stop = 0
+                                        }
+                                    }
+                                }
+                                else if `m' == `=`nbm_`j''-1' | `m' >= `maxm`j'_t1_g1' { // merge downward into the first lower category that is observed
+                                    local stop = 1
+                                    forvalues kk = 1/`=`m'' {
+                                        qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                        local v`kk'1_0 = r(N)
+                                        qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                        local v`kk'1_1 = r(N)
+                                        if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                            qui replace item`j'= `=`m' - `kk'' if item`j'==`m'
+                                            local zzz=`j'+`nbitems'
+                                            *qui replace item`zzz'= `=`m' - `kk'' if item`zzz'==`m'
+                                            *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                            local stop = 0
+                                        }
+                                    }
+                                }
+                                else {
+                                    if runiform()>0.5{ // middle category: merge direction is drawn at random
+                                        local stop = 1
+                                        forvalues kk = 1/`m' {
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                            local v`kk'1_0 = r(N)
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                            local v`kk'1_1 = r(N)
+                                            if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                                qui replace item`j'= `=`m'-`kk'' if item`j'==`m'
+                                                local zzz=`j'+`nbitems'
+                                                *qui replace item`zzz'=`=`m'-`kk'' if item``=`j'+`nbitems'''==`m'
+                                                *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                local stop = 0
+                                            }
+                                        }
+                                    }
+                                    else {
+                                        local stop = 1
+                                        forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                            local v`kk'1_0 = r(N)
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                            local v`kk'1_1 = r(N)
+                                            if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0{
+                                                qui replace item`j'=`=`m' + `kk'' if item`j'==`m'
+                                                local zzz=`j'+`nbitems'
+                                                *qui replace item`zzz'=`=`m' + `kk'' if item``=`j'+`nbitems'''==`m'
+                                                *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                local stop = 0
+                                            }
+                                            else {
+                                                if `stop' != 0 {
+                                                    qui replace item`j'= `nbm_`j'' if item`j'==`m'
+                                                    local zzz=`j'+`nbitems'
+                                                    *qui replace item`zzz'= `nbm_`j'' if item``=`j'+`nbitems'''==`m'
+                                                    *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                    local stop = 0
+                                                }
+                                            }
+                                        }
+                                    }
+                                }
+                            }
+                        }
+                        qui levelsof item`j'
+                        local val = r(levels)
+                        local checker: word 1 of `val'
+                        local checker2: word 2 of `val'
+                        local checker3: word 3 of `val'
+                        local nummoda=r(r)
+                        local nbmoda_`j'=`nummoda'-1 // FIX: store the number of non-zero categories (levels minus one), the convention used by the no-merge branch and by the model below
+                        if (`nummoda'==2) {
+                            qui recode item`j' (`checker'=0) (`checker2'=1)
+                        }
+                        if (`nummoda'==3) {
+                            if (`checker'!=0) {
+                                qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2)
+                            }
+                            else if (`checker2'!=1) {
+                                qui recode item`j' (`checker2'=1) (`checker3'=2)
+                            }
+                            else if (`checker3'!=2) {
+                                qui recode item`j' (`checker3'=2)
+                            }
+                        }
+                    }
+
+                    qui valuesof comz
+                    local val = r(values)
+                    local checker: word 1 of `val'
+                }
+                else {
+                    forvalues jj=1/`nbitems' {
+                        local nbmoda_`jj'=`nbmoda'
+                    }
+                }
+
+
+                * ROSALI
+                qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt)
+                qui mat resmat=r(difitems)
+                local nbitems2 = 2*`nbitems'
+
+                * Count the detected items: leading entries of resmat up to the first missing value
+                local nbdetect = `nbitems' // FIX: when no missing entry is found among the first nbitems cells, every item was detected (was 0)
+                local stop = 0
+                forvalues jj=1/`nbitems' {
+                    if (`stop'==0) {
+                        mat testm=J(1,1,.)
+                        if (resmat[1,`jj']==testm[1,1]) {
+                            local stop = 1
+                            local nbdetect = `jj'-1
+                        }
+                    }
+                }
+
+                * Store the detected items
+
+                * Constraint definitions (only for detected items whose flag in the second half of resmat is non-zero)
+                local csrt=0
+                mat testm=J(1,1,0)
+                forvalues u=1/`nbdetect' {
+                    local difitems`u'=resmat[1,`u']
+                    local i=`difitems`u''
+                    if (`nbmoda_`i''==3 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+                        local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+                        qui `constrnt`u''
+                        local v=`u'+100
+                        local constrnt`u'_2 = "constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))"
+                        qui `constrnt`u'_2'
+                    }
+                    if (`nbmoda_`i''==2 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+                        local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+                        qui `constrnt`u''
+                    }
+                }
+
+                * Model definition: the gsem command line is built as a string, one equation per non-zero category of each item
+                local mod "gsem "
+                local conformula = ""
+                forvalues i=1/`nbitems' {
+                    local mod = "`mod'"+"(1.item`i'<-THETA@1)"
+                    if (`nbmoda_`i''==3) {
+                        local mod = "`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)"
+                    }
+                    else if (`nbmoda_`i''==2) {
+                        local mod = "`mod'"+"(2.item`i'<-THETA@2)"
+                    }
+                }
+                forvalues u=1/`nbdetect' {
+                    local v=`difitems`u''
+                    local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)"
+                    if (`nbmoda_`v''==3) {
+                        local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)"
+                    }
+                    else if (`nbmoda_`v''==2) {
+                        local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)"
+                    }
+                    local w= 100+`u'
+                    if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==3) {
+                        local conformula = "`conformula'" + "`u' " + "`w' "
+                    }
+                    else if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==2) {
+                        local conformula = "`conformula'" + "`u' "
+                    }
+                }
+                if ("`conformula'" != "") {
+                    local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')"
+                }
+                else {
+                    local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent"
+                }
+                * Fit the model; W keeps the first two rows of r(table)
+                qui `mod'
+                mat V=r(table)
+                mat W=V[1..2,1...]
+
+                * Collect the item intercepts
+                forvalues j=1/`nbitems' {
+                    forvalues z=1/`nbmoda_`j'' {
+                        mat outmat[`k',colnumb(outmat,"item`j'_`z'")] = W[1,colnumb(W,"`z'.item`j':_cons")]
+                    }
+                }
+                * Collect the DIF coefficients, indexed by detection rank u; the item number goes to dif_detect_u
+                forvalues u=1/`nbdetect' {
+                    local j=`difitems`u''
+                    mat outmat[`k',colnumb(outmat,"dif_detect_`u'")] = `j'
+                    forvalues z=1/`nbmoda_`j'' {
+                        mat outmat[`k',colnumb(outmat,"dif_`u'_`z'")] = W[1,colnumb(W,"`z'.item`j':tt")]
+                    }
+                }
+
+                * Store the original DIF items read from variables dif1 to dif3
+                if (`nbdif' > 0) {
+                    qui levelsof dif1
+                    local ldif1 = r(levels)
+                    local diff1: word 1 of `ldif1'
+                    qui mat outmat[`k',colnumb(outmat,"real_dif_1")]=`diff1'
+                    if (`nbdif' > 1) {
+                        qui levelsof dif2
+                        local ldif2 = r(levels)
+                        local diff2: word 1 of `ldif2'
+                        qui mat outmat[`k',colnumb(outmat,"real_dif_2")]=`diff2'
+                        if (`nbdif' > 2) {
+                            qui levelsof dif3
+                            local ldif3 = r(levels)
+                            local diff3: word 1 of `ldif3'
+                            qui mat outmat[`k',colnumb(outmat,"real_dif_3")]=`diff3'
+                        }
+                    }
+                }
+                qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,colnumb(W,"THETA:tt")]
+                qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,colnumb(W,"THETA:tt")]
+                restore
+            }
+            putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace
+            putexcel A1=matrix(outmat), colnames
+}
+}
+}
diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S16.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S16.do
new file mode 100644
index 0000000..74fdc63
--- /dev/null
+++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S16.do
@@ -0,0 +1,364 @@
+*=================================================================================================================================================
+* Date : 2024-01-23
+* Stata version : Stata 18 SE
+*
+* This program analyses simulated data accounting for DIF through a partial credit model
+*
+* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea)
+*
+*
+*================================================================================================================================================
+adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom"
+
+* Driver: for each scenario number, sample size and sub-scenario letter, analyse replications 1 to 1000 and export one result row per replication
+local N = "50 100 200 300"
+local ss = "16"
+foreach s in `ss' {
+    foreach Nnn in `N' {
+        local Nn = `Nnn'
+        local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'"
+        if (`s'<=4) {
+            local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'"
+        }
+        local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'"
+        local scenarios = "A B C D E F G"
+        foreach scen in `scenarios' {
+            clear
+            import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear
+            rename TT tt
+            * Number of items, derived from the scenario number
+            if (`s'<=2) {
+                local nbitems=4
+            }
+            else if (`s'<=4) {
+                local nbitems=7
+            }
+            else if (`s'<=12) {
+                local nbitems=4
+            }
+            else {
+                local nbitems=7
+            }
+            * nbmoda is the highest category code, i.e. the number of non-zero response categories per item
+            if (mod(`s',2)==0) {
+                local nbmoda=3
+            }
+            else {
+                local nbmoda=1
+            }
+            * Number of DIF item columns (dif1, dif2, dif3) read from the data for this scenario
+            if (`s'<=4) {
+                local nbdif=0
+            }
+            else if (`s'<=8) {
+                local nbdif=1
+            }
+            else if (`s'<=16) {
+                local nbdif=2
+            }
+            else {
+                local nbdif=3
+            }
+            * taillemat = at most J*M cells for the item parameters and J*M cells for the DIF parameters + J cells for the detected DIF items + nbdif cells for the original DIF items + 2 cells for beta and se_beta
+            local taillemat=2*`nbitems'*`nbmoda'+`nbitems'+`nbdif'+2
+            local colna=""
+            forvalues i=1/`nbitems' {
+                forvalues z=1/`nbmoda' {
+                    local colna = "`colna'"+"item`i'_`z' "
+                    local colna = "`colna'"+"dif_`i'_`z' "
+                }
+            }
+            forvalues i=1/`nbitems' {
+                local colna = "`colna'"+"dif_detect_`i' "
+            }
+
+            forvalues i=1/`nbdif' {
+                local colna = "`colna'"+"real_dif_`i' "
+            }
+            local colna = "`colna'" + "beta " + "se_beta"
+
+            * One row of outmat per replication
+            mat outmat = J(1000,`taillemat',.)
+            mat colnames outmat= `colna'
+            di "Scenario `s'`scen' / N=`Nnn'"
+            forvalues k=1/1000 {
+                if (mod(`k',100)==0) {
+                    di "`k'/1000"
+                }
+                preserve
+                qui keep if replication==`k'
+
+
+                * Merge response categories that are empty in at least one group (only run when nbmoda>1 and N=50)
+
+                if (`nbmoda'>1 & `Nn'==50) {
+                    local com_z = 0
+                    qui gen comz = 0
+                    forvalues j = 1 / `nbitems' {
+                        local recoda_`j' = 0
+                        qui tab item`j' if tt == 0, matrow(rect1_g0_`j') matcell(nbrt1_g0_`j')
+                        local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1]
+                        local minm`j'_t1_g0 = rect1_g0_`j'[1,1]
+
+                        qui tab item`j' if tt == 1, matrow(rect1_g1_`j') matcell(nbrt1_g1_`j')
+                        local minm`j'_t1_g1 = rect1_g1_`j'[1,1]
+                        local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1]
+
+                        local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1')
+                        local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1')
+                        local nbm_`j' = `=`maxm_`j''-`minm_`j'''
+
+                        if `minm_`j'' != 0 & `com_z' == 0 {
+                            local com_z = 1
+                        }
+
+                        qui count if item`j' == 3 & tt == 0
+                        local mod3plac = r(N)
+                        qui count if item`j' == 3 & tt == 1
+                        local mod3tt = r(N)
+                        local nb_rn3 = min(`mod3plac',`mod3tt')
+                        if `nb_rn3'==0 {
+                            qui replace comz = 1
+                        }
+
+                        forvalues m = 0/`=`nbm_`j''-1' {
+                            qui count if item`j' == `m' & tt == 0
+                            local nb_rn1_g0 = r(N)
+                            qui count if item`j' == `m' & tt == 1
+                            local nb_rn1_g1 = r(N)
+                            local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1')
+                            if `nb_rn' == 0 {
+                                qui replace comz = 1
+                                local recoda_`j' = 1
+                                if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' { // merge upward into the first higher category that is observed
+                                    local stop = 1
+                                    forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                        qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                        local v`kk'1_0 = r(N)
+                                        qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                        local v`kk'1_1 = r(N)
+                                        if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                            qui replace item`j'= `=`m'+`kk'' if item`j'==`m'
+                                            local zzz=`j'+`nbitems'
+                                            *qui replace item`zzz'=`=`m'+`kk'' if item``=`j'+`nbitems'''==`m'
+                                            *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                            local stop = 0
+                                        }
+                                    }
+                                }
+                                else if `m' == `=`nbm_`j''-1' | `m' >= `maxm`j'_t1_g1' { // merge downward into the first lower category that is observed
+                                    local stop = 1
+                                    forvalues kk = 1/`=`m'' {
+                                        qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                        local v`kk'1_0 = r(N)
+                                        qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                        local v`kk'1_1 = r(N)
+                                        if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                            qui replace item`j'= `=`m' - `kk'' if item`j'==`m'
+                                            local zzz=`j'+`nbitems'
+                                            *qui replace item`zzz'= `=`m' - `kk'' if item`zzz'==`m'
+                                            *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                            local stop = 0
+                                        }
+                                    }
+                                }
+                                else {
+                                    if runiform()>0.5{ // middle category: merge direction is drawn at random
+                                        local stop = 1
+                                        forvalues kk = 1/`m' {
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                            local v`kk'1_0 = r(N)
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                            local v`kk'1_1 = r(N)
+                                            if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                                qui replace item`j'= `=`m'-`kk'' if item`j'==`m'
+                                                local zzz=`j'+`nbitems'
+                                                *qui replace item`zzz'=`=`m'-`kk'' if item``=`j'+`nbitems'''==`m'
+                                                *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                local stop = 0
+                                            }
+                                        }
+                                    }
+                                    else {
+                                        local stop = 1
+                                        forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                            local v`kk'1_0 = r(N)
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                            local v`kk'1_1 = r(N)
+                                            if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0{
+                                                qui replace item`j'=`=`m' + `kk'' if item`j'==`m'
+                                                local zzz=`j'+`nbitems'
+                                                *qui replace item`zzz'=`=`m' + `kk'' if item``=`j'+`nbitems'''==`m'
+                                                *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                local stop = 0
+                                            }
+                                            else {
+                                                if `stop' != 0 {
+                                                    qui replace item`j'= `nbm_`j'' if item`j'==`m'
+                                                    local zzz=`j'+`nbitems'
+                                                    *qui replace item`zzz'= `nbm_`j'' if item``=`j'+`nbitems'''==`m'
+                                                    *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+                                                    local stop = 0
+                                                }
+                                            }
+                                        }
+                                    }
+                                }
+                            }
+                        }
+                        qui levelsof item`j'
+                        local val = r(levels)
+                        local checker: word 1 of `val'
+                        local checker2: word 2 of `val'
+                        local checker3: word 3 of `val'
+                        local nummoda=r(r)
+                        local nbmoda_`j'=`nummoda'-1 // FIX: store the number of non-zero categories (levels minus one), the convention used by the no-merge branch and by the model below
+                        if (`nummoda'==2) {
+                            qui recode item`j' (`checker'=0) (`checker2'=1)
+                        }
+                        if (`nummoda'==3) {
+                            if (`checker'!=0) {
+                                qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2)
+                            }
+                            else if (`checker2'!=1) {
+                                qui recode item`j' (`checker2'=1) (`checker3'=2)
+                            }
+                            else if (`checker3'!=2) {
+                                qui recode item`j' (`checker3'=2)
+                            }
+                        }
+                    }
+
+                    qui valuesof comz
+                    local val = r(values)
+                    local checker: word 1 of `val'
+                }
+                else {
+                    forvalues jj=1/`nbitems' {
+                        local nbmoda_`jj'=`nbmoda'
+                    }
+                }
+
+
+                * ROSALI
+                qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt)
+                qui mat resmat=r(difitems)
+                local nbitems2 = 2*`nbitems'
+
+                * Count the detected items: leading entries of resmat up to the first missing value
+                local nbdetect = `nbitems' // FIX: when no missing entry is found among the first nbitems cells, every item was detected (was 0)
+                local stop = 0
+                forvalues jj=1/`nbitems' {
+                    if (`stop'==0) {
+                        mat testm=J(1,1,.)
+                        if (resmat[1,`jj']==testm[1,1]) {
+                            local stop = 1
+                            local nbdetect = `jj'-1
+                        }
+                    }
+                }
+
+                * Store the detected items
+
+                * Constraint definitions (only for detected items whose flag in the second half of resmat is non-zero)
+                local csrt=0
+                mat testm=J(1,1,0)
+                forvalues u=1/`nbdetect' {
+                    local difitems`u'=resmat[1,`u']
+                    local i=`difitems`u''
+                    if (`nbmoda_`i''==3 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+                        local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+                        qui `constrnt`u''
+                        local v=`u'+100
+                        local constrnt`u'_2 = "constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))"
+                        qui `constrnt`u'_2'
+                    }
+                    if (`nbmoda_`i''==2 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+                        local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+                        qui `constrnt`u''
+                    }
+                }
+
+                * Model definition: the gsem command line is built as a string, one equation per non-zero category of each item
+                local mod "gsem "
+                local conformula = ""
+                forvalues i=1/`nbitems' {
+                    local mod = "`mod'"+"(1.item`i'<-THETA@1)"
+                    if (`nbmoda_`i''==3) {
+                        local mod = "`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)"
+                    }
+                    else if (`nbmoda_`i''==2) {
+                        local mod = "`mod'"+"(2.item`i'<-THETA@2)"
+                    }
+                }
+                forvalues u=1/`nbdetect' {
+                    local v=`difitems`u''
+                    local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)"
+                    if (`nbmoda_`v''==3) {
+                        local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)"
+                    }
+                    else if (`nbmoda_`v''==2) {
+                        local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)"
+                    }
+                    local w= 100+`u'
+                    if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==3) {
+                        local conformula = "`conformula'" + "`u' " + "`w' "
+                    }
+                    else if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==2) {
+                        local conformula = "`conformula'" + "`u' "
+                    }
+                }
+                if ("`conformula'" != "") {
+                    local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')"
+                }
+                else {
+                    local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent"
+                }
+                * Fit the model; W keeps the first two rows of r(table)
+                qui `mod'
+                mat V=r(table)
+                mat W=V[1..2,1...]
+
+                * Collect the item intercepts
+                forvalues j=1/`nbitems' {
+                    forvalues z=1/`nbmoda_`j'' {
+                        mat outmat[`k',colnumb(outmat,"item`j'_`z'")] = W[1,colnumb(W,"`z'.item`j':_cons")]
+                    }
+                }
+                * Collect the DIF coefficients, indexed by detection rank u; the item number goes to dif_detect_u
+                forvalues u=1/`nbdetect' {
+                    local j=`difitems`u''
+                    mat outmat[`k',colnumb(outmat,"dif_detect_`u'")] = `j'
+                    forvalues z=1/`nbmoda_`j'' {
+                        mat outmat[`k',colnumb(outmat,"dif_`u'_`z'")] = W[1,colnumb(W,"`z'.item`j':tt")]
+                    }
+                }
+
+                * Store the original DIF items read from variables dif1 to dif3
+                if (`nbdif' > 0) {
+                    qui levelsof dif1
+                    local ldif1 = r(levels)
+                    local diff1: word 1 of `ldif1'
+                    qui mat outmat[`k',colnumb(outmat,"real_dif_1")]=`diff1'
+                    if (`nbdif' > 1) {
+                        qui levelsof dif2
+                        local ldif2 = r(levels)
+                        local diff2: word 1 of `ldif2'
+                        qui mat outmat[`k',colnumb(outmat,"real_dif_2")]=`diff2'
+                        if (`nbdif' > 2) {
+                            qui levelsof dif3
+                            local ldif3 = r(levels)
+                            local diff3: word 1 of `ldif3'
+                            qui mat outmat[`k',colnumb(outmat,"real_dif_3")]=`diff3'
+                        }
+                    }
+                }
+                qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,colnumb(W,"THETA:tt")]
+                qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,colnumb(W,"THETA:tt")]
+                restore
+            }
+            putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace
+            putexcel A1=matrix(outmat), colnames
+}
+}
+}
diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S17.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S17.do
new file mode 100644
index 0000000..218bc08
--- /dev/null
+++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S17.do
@@ -0,0 +1,364 @@
+*=================================================================================================================================================
+* Date : 2024-01-23
+* Stata version : Stata 18 SE
+*
+* This program analyses simulated data accounting for DIF through a partial credit model
+*
+* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea)
+*
+*
+*================================================================================================================================================ +adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom" + + +local N = "50 100 200 300" + local ss = "17" + foreach s in `ss' { + foreach Nnn in `N' { + local Nn = `Nnn' + local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'" + if (`s'<=4) { + local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'" + } + local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'" + local scenarios = "A B C D E F G" + foreach scen in `scenarios' { + clear + import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear + rename TT tt + + if (`s'<=2) { + local nbitems=4 + } + else if (`s'<=4) { + local nbitems=7 + } + else if (`s'<=12) { + local nbitems=4 + } + else { + local nbitems=7 + } + +if (mod(`s',2)==0) { + local nbmoda=3 +} +else { + local nbmoda=1 +} + + if (`s'<=4) { + local nbdif=0 + } + else if (`s'<=8) { + local nbdif=1 + } + else if (`s'<=16) { + local nbdif=2 + } + else { + local nbdif=3 + } + * taillemat = Maximum J*M cases pour les items par et J*M cases pour les dif par + J cases pour les DIF detect + nbdif cases pour dif réel + local taillemat=2*`nbitems'*`nbmoda'+`nbitems'+`nbdif'+2 + local colna="" + forvalues i=1/`nbitems' { + forvalues z=1/`nbmoda' { + local colna = "`colna'"+"item`i'_`z' " + local colna = "`colna'"+"dif_`i'_`z' " + } + } + forvalues i=1/`nbitems' { + local colna = "`colna'"+"dif_detect_`i' " + } + + forvalues i=1/`nbdif' { + local colna = "`colna'"+"real_dif_`i' " + } +local colna = "`colna'" + "beta " + "se_beta" + + + mat outmat = J(1000,`taillemat',.) 
+ mat colnames outmat= `colna' + di "Scenario `s'`scen' / N=`Nnn'" + forvalues k=1/1000 { + if (mod(`k',100)==0) { + di "`k'/1000" + } + preserve + qui keep if replication==`k' + + + * MERGE des modalités si non représentées + + if (`nbmoda'>1 & `Nn'==50) { + local com_z = 0 + qui gen comz = 0 + forvalues j = 1 / `nbitems' { + local recoda_`j' = 0 + qui tab item`j' if tt == 0, matrow(rect1_g0_`j') matcell(nbrt1_g0_`j') + local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1] + local minm`j'_t1_g0 = rect1_g0_`j'[1,1] + + qui tab item`j' if tt == 1, matrow(rect1_g1_`j') matcell(nbrt1_g1_`j') + local minm`j'_t1_g1 = rect1_g1_`j'[1,1] + local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1] + + local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1') + local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1') + local nbm_`j' = `=`maxm_`j''-`minm_`j''' + + if `minm_`j'' != 0 & `com_z' == 0 { + local com_z = 1 + } + + qui count if item`j' == 3 & tt == 0 + local mod3plac = r(N) + qui count if item`j' == 3 & tt == 1 + local mod3tt = r(N) + local nb_rn3 = min(`mod3plac',`mod3tt') + if `nb_rn3'==0 { + qui replace comz = 1 + } + + forvalues m = 0/`=`nbm_`j''-1' { + qui count if item`j' == `m' & tt == 0 + local nb_rn1_g0 = r(N) + qui count if item`j' == `m' & tt == 1 + local nb_rn1_g1 = r(N) + local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1') + if `nb_rn' == 0 { + qui replace comz = 1 + local recoda_`j' = 1 + if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' { + local stop = 1 + forvalues kk = 1/`=`nbm_`j''-`m'' { + qui count if item`j' == `=`m' + `kk'' & tt == 0 + local v`kk'1_0 = r(N) + qui count if item`j' == `=`m' + `kk'' & tt == 1 + local v`kk'1_1 = r(N) + if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 { + qui replace item`j'= `=`m'+`kk'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'=`=`m'+`kk'' if item``=`j'+`nbitems'''==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + } + } + else if `m' == `=`nbm_`j''-1' | `m' >= 
`maxm`j'_t1_g1' { + local stop = 1 + forvalues kk = 1/`=`m'' { + qui count if item`j' == `=`m' - `kk'' & tt == 0 + local v`kk'1_0 = r(N) + qui count if item`j' == `=`m' - `kk'' & tt == 1 + local v`kk'1_1 = r(N) + if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 { + qui replace item`j'= `=`m' - `kk'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'= `=`m' - `kk'' if item`zzz'==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + } + } + else { + if runiform()>0.5{ + local stop = 1 + forvalues kk = 1/`m' { + qui count if item`j' == `=`m' - `kk'' & tt == 0 + local v`kk'1_0 = r(N) + qui count if item`j' == `=`m' - `kk'' & tt == 1 + local v`kk'1_1 = r(N) + if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 { + qui replace item`j'= `=`m'-`kk'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'=`=`m'-`kk'' if item``=`j'+`nbitems'''==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + } + } + else { + local stop = 1 + forvalues kk = 1/`=`nbm_`j''-`m'' { + qui count if item`j' == `=`m' + `kk'' & tt == 0 + local v`kk'1_0 = r(N) + qui count if item`j' == `=`m' + `kk'' & tt == 1 + local v`kk'1_1 = r(N) + if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0{ + qui replace item`j'=`=`m' + `kk'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'=`=`m' + `kk'' if item``=`j'+`nbitems'''==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + else { + if `stop' != 0 { + qui replace item`j'= `nbm_`j'' if item`j'==`m' + local zzz=`j'+`nbitems' + *qui replace item`zzz'= `nbm_`j'' if item``=`j'+`nbitems'''==`m' + *di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged" + local stop = 0 + } + } + } + } + } + } + } + qui levelsof item`j' + local val = r(levels) + local checker: word 1 of `val' + local checker2: word 2 of `val' + local checker3: word 3 of `val' + local 
nummoda=r(r) + local nbmoda_`j'=`nummoda' + if (`nummoda'==2) { + qui recode item`j' (`checker'=0) (`checker2'=1) + } + if (`nummoda'==3) { + if (`checker'!=0) { + qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2) + } + else if (`checker2'!=1) { + qui recode item`j' (`checker2'=1) (`checker3'=2) + } + else if (`checker3'!=2) { + qui recode item`j' (`checker3'=2) + } + } + } + + qui valuesof comz + local val = r(values) + local checker: word 1 of `val' + } + else { + forvalues jj=1/`nbitems' { + local nbmoda_`jj'=`nbmoda' + } + } + + + * ROSALI + qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt) + qui mat resmat=r(difitems) + local nbitems2 = 2*`nbitems' + + * Calculer le nbre d'items détectés + local nbdetect = 0 + local stop = 0 + forvalues jj=1/`nbitems' { + if (`stop'==0) { + mat testm=J(1,1,.) + if (resmat[1,`jj']==testm[1,1]) { + local stop = 1 + local nbdetect = `jj'-1 + } + } + } + + * Stocker les items détectés + + * Définition des contraintes + local csrt=0 + mat testm=J(1,1,0) + forvalues u=1/`nbdetect' { + local difitems`u'=resmat[1,`u'] + local i=`difitems`u'' + if (`nbmoda_`i''==3 & resmat[1,`nbitems'+`i']!=testm[1,1]){ + local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))" + qui `constrnt`u'' + local v=`u'+100 + local constrnt`u'_2 = "constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))" + qui `constrnt`u'_2' + } + if (`nbmoda_`i''==2 & resmat[1,`nbitems'+`i']!=testm[1,1]){ + local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))" + qui `constrnt`u'' + } + } + + * Définition du modèle + local mod "gsem " + local conformula = "" + forvalues i=1/`nbitems' { + local mod = "`mod'"+"(1.item`i'<-THETA@1)" + if (`nbmoda_`i''==3) { + local mod = 
"`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)" + } + else if (`nbmoda_`i''==2) { + local mod = "`mod'"+"(2.item`i'<-THETA@2)" + } + } + forvalues u=1/`nbdetect' { + local v=`difitems`u'' + local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)" + if (`nbmoda_`v''==3) { + local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)" + } + else if (`nbmoda_`v''==2) { + local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)" + } + local w= 100+`u' + if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==3) { + local conformula = "`conformula'" + "`u' " + "`w' " + } + else if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==2) { + local conformula = "`conformula'" + "`u' " + } + } + if ("`conformula'" != "") { + local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')" + } + else { + local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent" + } + *calcul du modèle + qui `mod' + mat V=r(table) + mat W=V[1..2,1...] 
+			* W keeps rows 1-2 of r(table): row 1 is stored below as the estimates, row 2 as se_beta
+			* Store the item intercepts (_cons of each z.item equation) of replication k
+			forvalues j=1/`nbitems' {
+				forvalues z=1/`nbmoda_`j'' {
+					mat outmat[`k',colnumb(outmat,"item`j'_`z'")] = W[1,colnumb(W,"`z'.item`j':_cons")]
+				}
+			}
+			* Store the tt coefficients of the detected items: slot u follows detection order, dif_detect_u holds the item number
+			forvalues u=1/`nbdetect' {
+				local j=`difitems`u''
+				forvalues z=1/`nbmoda_`j'' {
+					mat outmat[`k',colnumb(outmat,"dif_`u'_`z'")] = W[1,colnumb(W,"`z'.item`j':tt")]
+					mat outmat[`k',colnumb(outmat,"dif_detect_`u'")] = `j'	// same value for every z
+				}
+			}
+			* The first level of dif1, dif2, dif3 is read from the data and stored as real_dif_1..3
+			* Store the original (true) DIF items
+			if (`nbdif' > 0) {
+				qui levelsof dif1
+				local ldif1 = r(levels)
+				local diff1: word 1 of `ldif1'
+				qui mat outmat[`k',colnumb(outmat,"real_dif_1")]=`diff1'
+				if (`nbdif' > 1) {
+					qui levelsof dif2
+					local ldif2 = r(levels)
+					local diff2: word 1 of `ldif2'
+					qui mat outmat[`k',colnumb(outmat,"real_dif_2")]=`diff2'
+					if (`nbdif' > 2) {
+						qui levelsof dif3
+						local ldif3 = r(levels)
+						local diff3: word 1 of `ldif3'
+						qui mat outmat[`k',colnumb(outmat,"real_dif_3")]=`diff3'
+					}
+				}
+			}
+			qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,colnumb(W,"THETA:tt")]
+			qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,colnumb(W,"THETA:tt")]
+			restore	// back to the full dataset before the next replication
+		}
+		putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace
+		putexcel A1=matrix(outmat), colnames
+}
+}
+}
diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S18.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S18.do
new file mode 100644
index 0000000..eb63617
--- /dev/null
+++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S18.do
@@ -0,0 +1,364 @@
+*=================================================================================================================================================
+* Date : 2024-01-23
+* Stata version : Stata 18 SE
+*
+* This program analyses simulated data accounting for DIF through a partial credit model
+*
+* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea)
+*
+*
+*================================================================================================================================================
+adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom"
+* Driver: for each sample size and sub-scenario A to G, run rosali_original on every replication (1 to 1000),
+* refit a gsem model that includes the detected DIF effects, and keep one row of estimates per replication.
+local N = "50 100 200 300"
+	local ss = "18"
+	foreach s in `ss' {
+	foreach Nnn in `N' {
+		local Nn = `Nnn'
+		local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'"
+		if (`s'<=4) {
+			local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'"
+		}
+		local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'"
+		local scenarios = "A B C D E F G"
+		foreach scen in `scenarios' {
+			clear
+			import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear
+			rename TT tt
+			* Scenario design derived from the scenario number s: number of items, highest category, number of true DIF items
+			if (`s'<=2) {
+				local nbitems=4
+			}
+			else if (`s'<=4) {
+				local nbitems=7
+			}
+			else if (`s'<=12) {
+				local nbitems=4
+			}
+			else {
+				local nbitems=7
+			}
+			* nbmoda is the highest response category: 3 for even scenario numbers, 1 for odd ones
+if (mod(`s',2)==0) {
+	local nbmoda=3
+}
+else {
+	local nbmoda=1
+}
+			* nbdif is the number of true DIF items (0 to 3)
+			if (`s'<=4) {
+				local nbdif=0
+			}
+			else if (`s'<=8) {
+				local nbdif=1
+			}
+			else if (`s'<=16) {
+				local nbdif=2
+			}
+			else {
+				local nbdif=3
+			}
+			* taillemat = at most J*M cells for the item parameters + J*M cells for the DIF parameters + J cells for the detected DIF items + nbdif cells for the true DIF items + 2 cells (beta, se_beta)
+			local taillemat=2*`nbitems'*`nbmoda'+`nbitems'+`nbdif'+2
+			local colna=""
+			forvalues i=1/`nbitems' {
+				forvalues z=1/`nbmoda' {
+					local colna = "`colna'"+"item`i'_`z' "
+					local colna = "`colna'"+"dif_`i'_`z' "
+				}
+			}
+			forvalues i=1/`nbitems' {
+				local colna = "`colna'"+"dif_detect_`i' "
+			}
+			* one column per true DIF item
+			forvalues i=1/`nbdif' {
+				local colna = "`colna'"+"real_dif_`i' "
+			}
+local colna = "`colna'" + "beta " + "se_beta"
+			* outmat: one row per replication, missing by default
+			* (cells that are never filled stay missing in the exported sheet)
+			mat outmat = J(1000,`taillemat',.)
+			mat colnames outmat= `colna'
+			di "Scenario `s'`scen' / N=`Nnn'"
+			forvalues k=1/1000 {
+				if (mod(`k',100)==0) {
+					di "`k'/1000"
+				}
+				preserve
+				qui keep if replication==`k'
+				* Only done when nbmoda>1 and N==50: a category m with zero count in either group (tt==0 or tt==1)
+				* is merged into a neighbouring observed category, then items left with 2 or 3 levels are recoded to 0..1 or 0..2.
+				* MERGE response categories that are not represented
+				* NOTE(review): the direction for interior categories is drawn with runiform() and no seed is set in this file.
+				if (`nbmoda'>1 & `Nn'==50) {
+					local com_z = 0
+					qui gen comz = 0
+					forvalues j = 1 / `nbitems' {
+						local recoda_`j' = 0
+						qui tab item`j' if tt == 0, matrow(rect1_g0_`j') matcell(nbrt1_g0_`j')
+						local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1]
+						local minm`j'_t1_g0 = rect1_g0_`j'[1,1]
+						* same extraction of the observed minimum and maximum for group tt==1
+						qui tab item`j' if tt == 1, matrow(rect1_g1_`j') matcell(nbrt1_g1_`j')
+						local minm`j'_t1_g1 = rect1_g1_`j'[1,1]
+						local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1]
+						* overall observed range across both groups; nbm_j = max - min
+						local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1')
+						local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1')
+						local nbm_`j' = `=`maxm_`j''-`minm_`j'''
+						* com_z records that at least one item has a non-zero minimum
+						if `minm_`j'' != 0 & `com_z' == 0 {
+							local com_z = 1
+						}
+						* comz is set to 1 when category 3 is empty in at least one group
+						qui count if item`j' == 3 & tt == 0
+						local mod3plac = r(N)
+						qui count if item`j' == 3 & tt == 1
+						local mod3tt = r(N)
+						local nb_rn3 = min(`mod3plac',`mod3tt')
+						if `nb_rn3'==0 {
+							qui replace comz = 1
+						}
+						* scan categories 0..nbm_j-1 for one that is empty in at least one group
+						forvalues m = 0/`=`nbm_`j''-1' {
+							qui count if item`j' == `m' & tt == 0
+							local nb_rn1_g0 = r(N)
+							qui count if item`j' == `m' & tt == 1
+							local nb_rn1_g1 = r(N)
+							local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1')
+							if `nb_rn' == 0 {
+								qui replace comz = 1
+								local recoda_`j' = 1
+								if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' {
+									local stop = 1	// merge upward: first higher category observed in either group
+									forvalues kk = 1/`=`nbm_`j''-`m'' {
+										qui count if item`j' == `=`m' + `kk'' & tt == 0
+										local v`kk'1_0 = r(N)
+										qui count if item`j' == `=`m' + `kk'' & tt == 1
+										local v`kk'1_1 = r(N)
+										if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+											qui replace item`j'= `=`m'+`kk'' if item`j'==`m'
+											local zzz=`j'+`nbitems'
+											*qui replace item`zzz'=`=`m'+`kk'' if item``=`j'+`nbitems'''==`m'
+											*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+											local stop = 0
+										}
+									}
+								}
+								else if `m' == `=`nbm_`j''-1' | `m' >= `maxm`j'_t1_g1' {
+									local stop = 1	// merge downward: first lower category observed in either group
+									forvalues kk = 1/`=`m'' {
+										qui count if item`j' == `=`m' - `kk'' & tt == 0
+										local v`kk'1_0 = r(N)
+										qui count if item`j' == `=`m' - `kk'' & tt == 1
+										local v`kk'1_1 = r(N)
+										if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+											qui replace item`j'= `=`m' - `kk'' if item`j'==`m'
+											local zzz=`j'+`nbitems'
+											*qui replace item`zzz'= `=`m' - `kk'' if item`zzz'==`m'
+											*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+											local stop = 0
+										}
+									}
+								}
+								else {
+									if runiform()>0.5{
+										local stop = 1	// interior category, random draw: merge downward
+										forvalues kk = 1/`m' {
+											qui count if item`j' == `=`m' - `kk'' & tt == 0
+											local v`kk'1_0 = r(N)
+											qui count if item`j' == `=`m' - `kk'' & tt == 1
+											local v`kk'1_1 = r(N)
+											if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+												qui replace item`j'= `=`m'-`kk'' if item`j'==`m'
+												local zzz=`j'+`nbitems'
+												*qui replace item`zzz'=`=`m'-`kk'' if item``=`j'+`nbitems'''==`m'
+												*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+												local stop = 0
+											}
+										}
+									}
+									else {
+										local stop = 1	// interior category, random draw: merge upward, else into nbm_j
+										forvalues kk = 1/`=`nbm_`j''-`m'' {
+											qui count if item`j' == `=`m' + `kk'' & tt == 0
+											local v`kk'1_0 = r(N)
+											qui count if item`j' == `=`m' + `kk'' & tt == 1
+											local v`kk'1_1 = r(N)
+											if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0{
+												qui replace item`j'=`=`m' + `kk'' if item`j'==`m'
+												local zzz=`j'+`nbitems'
+												*qui replace item`zzz'=`=`m' + `kk'' if item``=`j'+`nbitems'''==`m'
+												*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+												local stop = 0
+											}
+											else {
+												if `stop' != 0 {
+													qui replace item`j'= `nbm_`j'' if item`j'==`m'
+													local zzz=`j'+`nbitems'
+													*qui replace item`zzz'= `nbm_`j'' if item``=`j'+`nbitems'''==`m'
+													*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+													local stop = 0
+												}
+											}
+										}
+									}
+								}
+							}
+						}
+						qui levelsof item`j'
+						local val = r(levels)
+						local checker: word 1 of `val'
+						local checker2: word 2 of `val'
+						local checker3: word 3 of `val'
+						local nummoda=r(r)
+						local nbmoda_`j'=`nummoda'-1	// FIX: highest category code = number of levels - 1, same convention as nbmoda (was the raw level count)
+						if (`nummoda'==2) {
+							qui recode item`j' (`checker'=0) (`checker2'=1)
+						}
+						if (`nummoda'==3) {
+							if (`checker'!=0) {
+								qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2)
+							}
+							else if (`checker2'!=1) {
+								qui recode item`j' (`checker2'=1) (`checker3'=2)
+							}
+							else if (`checker3'!=2) {
+								qui recode item`j' (`checker3'=2)
+							}
+						}
+					}
+					* valuesof is not a built-in command; its result is not used further in this section
+					qui valuesof comz
+					local val = r(values)
+					local checker: word 1 of `val'
+				}
+				else {
+					forvalues jj=1/`nbitems' {
+						local nbmoda_`jj'=`nbmoda'
+					}
+				}
+				* Run the DIF detection; r(difitems) is read below as: entries 1..nbitems = detected item numbers
+				* (missing when unused), entry nbitems+i = flag compared with 0 to decide whether item i gets constraints.
+				* ROSALI
+				qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt)
+				qui mat resmat=r(difitems)
+				local nbitems2 = 2*`nbitems'
+				* NOTE(review): nbdetect stays 0 if none of the first nbitems entries is missing; confirm this cannot happen
+				* Count the detected items: position of the first missing entry of resmat, minus one
+				local nbdetect = 0
+				local stop = 0
+				forvalues jj=1/`nbitems' {
+					if (`stop'==0) {
+						mat testm=J(1,1,.)
+						if (resmat[1,`jj']==testm[1,1]) {
+							local stop = 1
+							local nbdetect = `jj'-1
+						}
+					}
+				}
+				* Constraint u (and 100+u for 4-level items) ties the tt effects of a detected item across its categories
+				* Store the detected items
+				* when the flag in resmat[1,nbitems+i] is non-zero
+				* Define the constraints
+				local csrt=0
+				mat testm=J(1,1,0)
+				forvalues u=1/`nbdetect' {
+					local difitems`u'=resmat[1,`u']
+					local i=`difitems`u''
+					if (`nbmoda_`i''==3 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+						local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+						qui `constrnt`u''
+						local v=`u'+100
+						local constrnt`u'_2 = "constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))"
+						qui `constrnt`u'_2'
+					}
+					if (`nbmoda_`i''==2 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+						local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+						qui `constrnt`u''
+					}
+				}
+				* One equation per non-zero category z of each item with the loading fixed at z (THETA@z)
+				* Define the model
+				local mod "gsem "
+				local conformula = ""
+				forvalues i=1/`nbitems' {
+					local mod = "`mod'"+"(1.item`i'<-THETA@1)"
+					if (`nbmoda_`i''==3) {
+						local mod = "`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)"
+					}
+					else if (`nbmoda_`i''==2) {
+						local mod = "`mod'"+"(2.item`i'<-THETA@2)"
+					}
+				}
+				forvalues u=1/`nbdetect' {
+					local v=`difitems`u''
+					local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)"
+					if (`nbmoda_`v''==3) {
+						local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)"
+					}
+					else if (`nbmoda_`v''==2) {
+						local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)"
+					}
+					local w= 100+`u'
+					if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==3) {
+						local conformula = "`conformula'" + "`u' " + "`w' "
+					}
+					else if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==2) {
+						local conformula = "`conformula'" + "`u' "
+					}
+				}
+				if ("`conformula'" != "") {
+					local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')"
+				}
+				else {
+					local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent"
+				}
+				* Fit the model and keep the first two rows of r(table)
+				qui `mod'
+				mat V=r(table)
+				mat W=V[1..2,1...]
+			* W keeps rows 1-2 of r(table): row 1 is stored below as the estimates, row 2 as se_beta
+			* Store the item intercepts (_cons of each z.item equation) of replication k
+			forvalues j=1/`nbitems' {
+				forvalues z=1/`nbmoda_`j'' {
+					mat outmat[`k',colnumb(outmat,"item`j'_`z'")] = W[1,colnumb(W,"`z'.item`j':_cons")]
+				}
+			}
+			* Store the tt coefficients of the detected items: slot u follows detection order, dif_detect_u holds the item number
+			forvalues u=1/`nbdetect' {
+				local j=`difitems`u''
+				forvalues z=1/`nbmoda_`j'' {
+					mat outmat[`k',colnumb(outmat,"dif_`u'_`z'")] = W[1,colnumb(W,"`z'.item`j':tt")]
+					mat outmat[`k',colnumb(outmat,"dif_detect_`u'")] = `j'	// same value for every z
+				}
+			}
+			* The first level of dif1, dif2, dif3 is read from the data and stored as real_dif_1..3
+			* Store the original (true) DIF items
+			if (`nbdif' > 0) {
+				qui levelsof dif1
+				local ldif1 = r(levels)
+				local diff1: word 1 of `ldif1'
+				qui mat outmat[`k',colnumb(outmat,"real_dif_1")]=`diff1'
+				if (`nbdif' > 1) {
+					qui levelsof dif2
+					local ldif2 = r(levels)
+					local diff2: word 1 of `ldif2'
+					qui mat outmat[`k',colnumb(outmat,"real_dif_2")]=`diff2'
+					if (`nbdif' > 2) {
+						qui levelsof dif3
+						local ldif3 = r(levels)
+						local diff3: word 1 of `ldif3'
+						qui mat outmat[`k',colnumb(outmat,"real_dif_3")]=`diff3'
+					}
+				}
+			}
+			qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,colnumb(W,"THETA:tt")]
+			qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,colnumb(W,"THETA:tt")]
+			restore	// back to the full dataset before the next replication
+		}
+		putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace
+		putexcel A1=matrix(outmat), colnames
+}
+}
+}
diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S19.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S19.do
new file mode 100644
index 0000000..a58cb17
--- /dev/null
+++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S19.do
@@ -0,0 +1,364 @@
+*=================================================================================================================================================
+* Date : 2024-01-23
+* Stata version : Stata 18 SE
+*
+* This program analyses simulated data accounting for DIF through a partial credit model
+*
+* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea)
+*
+*
+*================================================================================================================================================
+adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom"
+* Driver: for each sample size and sub-scenario A to G, run rosali_original on every replication (1 to 1000),
+* refit a gsem model that includes the detected DIF effects, and keep one row of estimates per replication.
+local N = "50 100 200 300"
+	local ss = "19"
+	foreach s in `ss' {
+	foreach Nnn in `N' {
+		local Nn = `Nnn'
+		local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'"
+		if (`s'<=4) {
+			local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'"
+		}
+		local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'"
+		local scenarios = "A B C D E F G"
+		foreach scen in `scenarios' {
+			clear
+			import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear
+			rename TT tt
+			* Scenario design derived from the scenario number s: number of items, highest category, number of true DIF items
+			if (`s'<=2) {
+				local nbitems=4
+			}
+			else if (`s'<=4) {
+				local nbitems=7
+			}
+			else if (`s'<=12) {
+				local nbitems=4
+			}
+			else {
+				local nbitems=7
+			}
+			* nbmoda is the highest response category: 3 for even scenario numbers, 1 for odd ones
+if (mod(`s',2)==0) {
+	local nbmoda=3
+}
+else {
+	local nbmoda=1
+}
+			* nbdif is the number of true DIF items (0 to 3)
+			if (`s'<=4) {
+				local nbdif=0
+			}
+			else if (`s'<=8) {
+				local nbdif=1
+			}
+			else if (`s'<=16) {
+				local nbdif=2
+			}
+			else {
+				local nbdif=3
+			}
+			* taillemat = at most J*M cells for the item parameters + J*M cells for the DIF parameters + J cells for the detected DIF items + nbdif cells for the true DIF items + 2 cells (beta, se_beta)
+			local taillemat=2*`nbitems'*`nbmoda'+`nbitems'+`nbdif'+2
+			local colna=""
+			forvalues i=1/`nbitems' {
+				forvalues z=1/`nbmoda' {
+					local colna = "`colna'"+"item`i'_`z' "
+					local colna = "`colna'"+"dif_`i'_`z' "
+				}
+			}
+			forvalues i=1/`nbitems' {
+				local colna = "`colna'"+"dif_detect_`i' "
+			}
+			* one column per true DIF item
+			forvalues i=1/`nbdif' {
+				local colna = "`colna'"+"real_dif_`i' "
+			}
+local colna = "`colna'" + "beta " + "se_beta"
+			* outmat: one row per replication, missing by default
+			* (cells that are never filled stay missing in the exported sheet)
+			mat outmat = J(1000,`taillemat',.)
+			mat colnames outmat= `colna'
+			di "Scenario `s'`scen' / N=`Nnn'"
+			forvalues k=1/1000 {
+				if (mod(`k',100)==0) {
+					di "`k'/1000"
+				}
+				preserve
+				qui keep if replication==`k'
+				* Only done when nbmoda>1 and N==50: a category m with zero count in either group (tt==0 or tt==1)
+				* is merged into a neighbouring observed category, then items left with 2 or 3 levels are recoded to 0..1 or 0..2.
+				* MERGE response categories that are not represented
+				* NOTE(review): the direction for interior categories is drawn with runiform() and no seed is set in this file.
+				if (`nbmoda'>1 & `Nn'==50) {
+					local com_z = 0
+					qui gen comz = 0
+					forvalues j = 1 / `nbitems' {
+						local recoda_`j' = 0
+						qui tab item`j' if tt == 0, matrow(rect1_g0_`j') matcell(nbrt1_g0_`j')
+						local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1]
+						local minm`j'_t1_g0 = rect1_g0_`j'[1,1]
+						* same extraction of the observed minimum and maximum for group tt==1
+						qui tab item`j' if tt == 1, matrow(rect1_g1_`j') matcell(nbrt1_g1_`j')
+						local minm`j'_t1_g1 = rect1_g1_`j'[1,1]
+						local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1]
+						* overall observed range across both groups; nbm_j = max - min
+						local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1')
+						local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1')
+						local nbm_`j' = `=`maxm_`j''-`minm_`j'''
+						* com_z records that at least one item has a non-zero minimum
+						if `minm_`j'' != 0 & `com_z' == 0 {
+							local com_z = 1
+						}
+						* comz is set to 1 when category 3 is empty in at least one group
+						qui count if item`j' == 3 & tt == 0
+						local mod3plac = r(N)
+						qui count if item`j' == 3 & tt == 1
+						local mod3tt = r(N)
+						local nb_rn3 = min(`mod3plac',`mod3tt')
+						if `nb_rn3'==0 {
+							qui replace comz = 1
+						}
+						* scan categories 0..nbm_j-1 for one that is empty in at least one group
+						forvalues m = 0/`=`nbm_`j''-1' {
+							qui count if item`j' == `m' & tt == 0
+							local nb_rn1_g0 = r(N)
+							qui count if item`j' == `m' & tt == 1
+							local nb_rn1_g1 = r(N)
+							local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1')
+							if `nb_rn' == 0 {
+								qui replace comz = 1
+								local recoda_`j' = 1
+								if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' {
+									local stop = 1	// merge upward: first higher category observed in either group
+									forvalues kk = 1/`=`nbm_`j''-`m'' {
+										qui count if item`j' == `=`m' + `kk'' & tt == 0
+										local v`kk'1_0 = r(N)
+										qui count if item`j' == `=`m' + `kk'' & tt == 1
+										local v`kk'1_1 = r(N)
+										if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+											qui replace item`j'= `=`m'+`kk'' if item`j'==`m'
+											local zzz=`j'+`nbitems'
+											*qui replace item`zzz'=`=`m'+`kk'' if item``=`j'+`nbitems'''==`m'
+											*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+											local stop = 0
+										}
+									}
+								}
+								else if `m' == `=`nbm_`j''-1' | `m' >= `maxm`j'_t1_g1' {
+									local stop = 1	// merge downward: first lower category observed in either group
+									forvalues kk = 1/`=`m'' {
+										qui count if item`j' == `=`m' - `kk'' & tt == 0
+										local v`kk'1_0 = r(N)
+										qui count if item`j' == `=`m' - `kk'' & tt == 1
+										local v`kk'1_1 = r(N)
+										if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+											qui replace item`j'= `=`m' - `kk'' if item`j'==`m'
+											local zzz=`j'+`nbitems'
+											*qui replace item`zzz'= `=`m' - `kk'' if item`zzz'==`m'
+											*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+											local stop = 0
+										}
+									}
+								}
+								else {
+									if runiform()>0.5{
+										local stop = 1	// interior category, random draw: merge downward
+										forvalues kk = 1/`m' {
+											qui count if item`j' == `=`m' - `kk'' & tt == 0
+											local v`kk'1_0 = r(N)
+											qui count if item`j' == `=`m' - `kk'' & tt == 1
+											local v`kk'1_1 = r(N)
+											if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+												qui replace item`j'= `=`m'-`kk'' if item`j'==`m'
+												local zzz=`j'+`nbitems'
+												*qui replace item`zzz'=`=`m'-`kk'' if item``=`j'+`nbitems'''==`m'
+												*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+												local stop = 0
+											}
+										}
+									}
+									else {
+										local stop = 1	// interior category, random draw: merge upward, else into nbm_j
+										forvalues kk = 1/`=`nbm_`j''-`m'' {
+											qui count if item`j' == `=`m' + `kk'' & tt == 0
+											local v`kk'1_0 = r(N)
+											qui count if item`j' == `=`m' + `kk'' & tt == 1
+											local v`kk'1_1 = r(N)
+											if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0{
+												qui replace item`j'=`=`m' + `kk'' if item`j'==`m'
+												local zzz=`j'+`nbitems'
+												*qui replace item`zzz'=`=`m' + `kk'' if item``=`j'+`nbitems'''==`m'
+												*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+												local stop = 0
+											}
+											else {
+												if `stop' != 0 {
+													qui replace item`j'= `nbm_`j'' if item`j'==`m'
+													local zzz=`j'+`nbitems'
+													*qui replace item`zzz'= `nbm_`j'' if item``=`j'+`nbitems'''==`m'
+													*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+													local stop = 0
+												}
+											}
+										}
+									}
+								}
+							}
+						}
+						qui levelsof item`j'
+						local val = r(levels)
+						local checker: word 1 of `val'
+						local checker2: word 2 of `val'
+						local checker3: word 3 of `val'
+						local nummoda=r(r)
+						local nbmoda_`j'=`nummoda'-1	// FIX: highest category code = number of levels - 1, same convention as nbmoda (was the raw level count)
+						if (`nummoda'==2) {
+							qui recode item`j' (`checker'=0) (`checker2'=1)
+						}
+						if (`nummoda'==3) {
+							if (`checker'!=0) {
+								qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2)
+							}
+							else if (`checker2'!=1) {
+								qui recode item`j' (`checker2'=1) (`checker3'=2)
+							}
+							else if (`checker3'!=2) {
+								qui recode item`j' (`checker3'=2)
+							}
+						}
+					}
+					* valuesof is not a built-in command; its result is not used further in this section
+					qui valuesof comz
+					local val = r(values)
+					local checker: word 1 of `val'
+				}
+				else {
+					forvalues jj=1/`nbitems' {
+						local nbmoda_`jj'=`nbmoda'
+					}
+				}
+				* Run the DIF detection; r(difitems) is read below as: entries 1..nbitems = detected item numbers
+				* (missing when unused), entry nbitems+i = flag compared with 0 to decide whether item i gets constraints.
+				* ROSALI
+				qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt)
+				qui mat resmat=r(difitems)
+				local nbitems2 = 2*`nbitems'
+				* NOTE(review): nbdetect stays 0 if none of the first nbitems entries is missing; confirm this cannot happen
+				* Count the detected items: position of the first missing entry of resmat, minus one
+				local nbdetect = 0
+				local stop = 0
+				forvalues jj=1/`nbitems' {
+					if (`stop'==0) {
+						mat testm=J(1,1,.)
+						if (resmat[1,`jj']==testm[1,1]) {
+							local stop = 1
+							local nbdetect = `jj'-1
+						}
+					}
+				}
+				* Constraint u (and 100+u for 4-level items) ties the tt effects of a detected item across its categories
+				* Store the detected items
+				* when the flag in resmat[1,nbitems+i] is non-zero
+				* Define the constraints
+				local csrt=0
+				mat testm=J(1,1,0)
+				forvalues u=1/`nbdetect' {
+					local difitems`u'=resmat[1,`u']
+					local i=`difitems`u''
+					if (`nbmoda_`i''==3 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+						local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+						qui `constrnt`u''
+						local v=`u'+100
+						local constrnt`u'_2 = "constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))"
+						qui `constrnt`u'_2'
+					}
+					if (`nbmoda_`i''==2 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+						local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+						qui `constrnt`u''
+					}
+				}
+				* One equation per non-zero category z of each item with the loading fixed at z (THETA@z)
+				* Define the model
+				local mod "gsem "
+				local conformula = ""
+				forvalues i=1/`nbitems' {
+					local mod = "`mod'"+"(1.item`i'<-THETA@1)"
+					if (`nbmoda_`i''==3) {
+						local mod = "`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)"
+					}
+					else if (`nbmoda_`i''==2) {
+						local mod = "`mod'"+"(2.item`i'<-THETA@2)"
+					}
+				}
+				forvalues u=1/`nbdetect' {
+					local v=`difitems`u''
+					local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)"
+					if (`nbmoda_`v''==3) {
+						local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)"
+					}
+					else if (`nbmoda_`v''==2) {
+						local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)"
+					}
+					local w= 100+`u'
+					if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==3) {
+						local conformula = "`conformula'" + "`u' " + "`w' "
+					}
+					else if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==2) {
+						local conformula = "`conformula'" + "`u' "
+					}
+				}
+				if ("`conformula'" != "") {
+					local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')"
+				}
+				else {
+					local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent"
+				}
+				* Fit the model and keep the first two rows of r(table)
+				qui `mod'
+				mat V=r(table)
+				mat W=V[1..2,1...]
+			* W keeps rows 1-2 of r(table): row 1 is stored below as the estimates, row 2 as se_beta
+			* Store the item intercepts (_cons of each z.item equation) of replication k
+			forvalues j=1/`nbitems' {
+				forvalues z=1/`nbmoda_`j'' {
+					mat outmat[`k',colnumb(outmat,"item`j'_`z'")] = W[1,colnumb(W,"`z'.item`j':_cons")]
+				}
+			}
+			* Store the tt coefficients of the detected items: slot u follows detection order, dif_detect_u holds the item number
+			forvalues u=1/`nbdetect' {
+				local j=`difitems`u''
+				forvalues z=1/`nbmoda_`j'' {
+					mat outmat[`k',colnumb(outmat,"dif_`u'_`z'")] = W[1,colnumb(W,"`z'.item`j':tt")]
+					mat outmat[`k',colnumb(outmat,"dif_detect_`u'")] = `j'	// same value for every z
+				}
+			}
+			* The first level of dif1, dif2, dif3 is read from the data and stored as real_dif_1..3
+			* Store the original (true) DIF items
+			if (`nbdif' > 0) {
+				qui levelsof dif1
+				local ldif1 = r(levels)
+				local diff1: word 1 of `ldif1'
+				qui mat outmat[`k',colnumb(outmat,"real_dif_1")]=`diff1'
+				if (`nbdif' > 1) {
+					qui levelsof dif2
+					local ldif2 = r(levels)
+					local diff2: word 1 of `ldif2'
+					qui mat outmat[`k',colnumb(outmat,"real_dif_2")]=`diff2'
+					if (`nbdif' > 2) {
+						qui levelsof dif3
+						local ldif3 = r(levels)
+						local diff3: word 1 of `ldif3'
+						qui mat outmat[`k',colnumb(outmat,"real_dif_3")]=`diff3'
+					}
+				}
+			}
+			qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,colnumb(W,"THETA:tt")]
+			qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,colnumb(W,"THETA:tt")]
+			restore	// back to the full dataset before the next replication
+		}
+		putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace
+		putexcel A1=matrix(outmat), colnames
+}
+}
+}
diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S2.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S2.do
new file mode 100644
index 0000000..5d96e1c
--- /dev/null
+++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S2.do
@@ -0,0 +1,364 @@
+*=================================================================================================================================================
+* Date : 2024-01-23
+* Stata version : Stata 18 SE
+*
+* This program analyses simulated data accounting for DIF through a partial credit model
+*
+* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea)
+*
+*
+*================================================================================================================================================
+adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom"
+* Driver: for each sample size and sub-scenario A to G, run rosali_original on every replication (1 to 1000),
+* refit a gsem model that includes the detected DIF effects, and keep one row of estimates per replication.
+local N = "50 100 200 300"
+	local ss = "2"
+	foreach s in `ss' {
+	foreach Nnn in `N' {
+		local Nn = `Nnn'
+		local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'"
+		if (`s'<=4) {
+			local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'"
+		}
+		local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'"
+		local scenarios = "A B C D E F G"
+		foreach scen in `scenarios' {
+			clear
+			import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear
+			rename TT tt
+			* Scenario design derived from the scenario number s: number of items, highest category, number of true DIF items
+			if (`s'<=2) {
+				local nbitems=4
+			}
+			else if (`s'<=4) {
+				local nbitems=7
+			}
+			else if (`s'<=12) {
+				local nbitems=4
+			}
+			else {
+				local nbitems=7
+			}
+			* nbmoda is the highest response category: 3 for even scenario numbers, 1 for odd ones
+if (mod(`s',2)==0) {
+	local nbmoda=3
+}
+else {
+	local nbmoda=1
+}
+			* nbdif is the number of true DIF items (0 to 3)
+			if (`s'<=4) {
+				local nbdif=0
+			}
+			else if (`s'<=8) {
+				local nbdif=1
+			}
+			else if (`s'<=16) {
+				local nbdif=2
+			}
+			else {
+				local nbdif=3
+			}
+			* taillemat = at most J*M cells for the item parameters + J*M cells for the DIF parameters + J cells for the detected DIF items + nbdif cells for the true DIF items + 2 cells (beta, se_beta)
+			local taillemat=2*`nbitems'*`nbmoda'+`nbitems'+`nbdif'+2
+			local colna=""
+			forvalues i=1/`nbitems' {
+				forvalues z=1/`nbmoda' {
+					local colna = "`colna'"+"item`i'_`z' "
+					local colna = "`colna'"+"dif_`i'_`z' "
+				}
+			}
+			forvalues i=1/`nbitems' {
+				local colna = "`colna'"+"dif_detect_`i' "
+			}
+			* one column per true DIF item
+			forvalues i=1/`nbdif' {
+				local colna = "`colna'"+"real_dif_`i' "
+			}
+local colna = "`colna'" + "beta " + "se_beta"
+			* outmat: one row per replication, missing by default
+			* (cells that are never filled stay missing in the exported sheet)
+			mat outmat = J(1000,`taillemat',.)
+			mat colnames outmat= `colna'
+			di "Scenario `s'`scen' / N=`Nnn'"
+			forvalues k=1/1000 {
+				if (mod(`k',100)==0) {
+					di "`k'/1000"
+				}
+				preserve
+				qui keep if replication==`k'
+				* Only done when nbmoda>1 and N==50: a category m with zero count in either group (tt==0 or tt==1)
+				* is merged into a neighbouring observed category, then items left with 2 or 3 levels are recoded to 0..1 or 0..2.
+				* MERGE response categories that are not represented
+				* NOTE(review): the direction for interior categories is drawn with runiform() and no seed is set in this file.
+				if (`nbmoda'>1 & `Nn'==50) {
+					local com_z = 0
+					qui gen comz = 0
+					forvalues j = 1 / `nbitems' {
+						local recoda_`j' = 0
+						qui tab item`j' if tt == 0, matrow(rect1_g0_`j') matcell(nbrt1_g0_`j')
+						local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1]
+						local minm`j'_t1_g0 = rect1_g0_`j'[1,1]
+						* same extraction of the observed minimum and maximum for group tt==1
+						qui tab item`j' if tt == 1, matrow(rect1_g1_`j') matcell(nbrt1_g1_`j')
+						local minm`j'_t1_g1 = rect1_g1_`j'[1,1]
+						local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1]
+						* overall observed range across both groups; nbm_j = max - min
+						local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1')
+						local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1')
+						local nbm_`j' = `=`maxm_`j''-`minm_`j'''
+						* com_z records that at least one item has a non-zero minimum
+						if `minm_`j'' != 0 & `com_z' == 0 {
+							local com_z = 1
+						}
+						* comz is set to 1 when category 3 is empty in at least one group
+						qui count if item`j' == 3 & tt == 0
+						local mod3plac = r(N)
+						qui count if item`j' == 3 & tt == 1
+						local mod3tt = r(N)
+						local nb_rn3 = min(`mod3plac',`mod3tt')
+						if `nb_rn3'==0 {
+							qui replace comz = 1
+						}
+						* scan categories 0..nbm_j-1 for one that is empty in at least one group
+						forvalues m = 0/`=`nbm_`j''-1' {
+							qui count if item`j' == `m' & tt == 0
+							local nb_rn1_g0 = r(N)
+							qui count if item`j' == `m' & tt == 1
+							local nb_rn1_g1 = r(N)
+							local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1')
+							if `nb_rn' == 0 {
+								qui replace comz = 1
+								local recoda_`j' = 1
+								if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' {
+									local stop = 1	// merge upward: first higher category observed in either group
+									forvalues kk = 1/`=`nbm_`j''-`m'' {
+										qui count if item`j' == `=`m' + `kk'' & tt == 0
+										local v`kk'1_0 = r(N)
+										qui count if item`j' == `=`m' + `kk'' & tt == 1
+										local v`kk'1_1 = r(N)
+										if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+											qui replace item`j'= `=`m'+`kk'' if item`j'==`m'
+											local zzz=`j'+`nbitems'
+											*qui replace item`zzz'=`=`m'+`kk'' if item``=`j'+`nbitems'''==`m'
+											*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+											local stop = 0
+										}
+									}
+								}
+								else if `m' == `=`nbm_`j''-1' | `m' >= `maxm`j'_t1_g1' {
+									local stop = 1	// merge downward: first lower category observed in either group
+									forvalues kk = 1/`=`m'' {
+										qui count if item`j' == `=`m' - `kk'' & tt == 0
+										local v`kk'1_0 = r(N)
+										qui count if item`j' == `=`m' - `kk'' & tt == 1
+										local v`kk'1_1 = r(N)
+										if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+											qui replace item`j'= `=`m' - `kk'' if item`j'==`m'
+											local zzz=`j'+`nbitems'
+											*qui replace item`zzz'= `=`m' - `kk'' if item`zzz'==`m'
+											*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+											local stop = 0
+										}
+									}
+								}
+								else {
+									if runiform()>0.5{
+										local stop = 1	// interior category, random draw: merge downward
+										forvalues kk = 1/`m' {
+											qui count if item`j' == `=`m' - `kk'' & tt == 0
+											local v`kk'1_0 = r(N)
+											qui count if item`j' == `=`m' - `kk'' & tt == 1
+											local v`kk'1_1 = r(N)
+											if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+												qui replace item`j'= `=`m'-`kk'' if item`j'==`m'
+												local zzz=`j'+`nbitems'
+												*qui replace item`zzz'=`=`m'-`kk'' if item``=`j'+`nbitems'''==`m'
+												*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+												local stop = 0
+											}
+										}
+									}
+									else {
+										local stop = 1	// interior category, random draw: merge upward, else into nbm_j
+										forvalues kk = 1/`=`nbm_`j''-`m'' {
+											qui count if item`j' == `=`m' + `kk'' & tt == 0
+											local v`kk'1_0 = r(N)
+											qui count if item`j' == `=`m' + `kk'' & tt == 1
+											local v`kk'1_1 = r(N)
+											if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0{
+												qui replace item`j'=`=`m' + `kk'' if item`j'==`m'
+												local zzz=`j'+`nbitems'
+												*qui replace item`zzz'=`=`m' + `kk'' if item``=`j'+`nbitems'''==`m'
+												*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+												local stop = 0
+											}
+											else {
+												if `stop' != 0 {
+													qui replace item`j'= `nbm_`j'' if item`j'==`m'
+													local zzz=`j'+`nbitems'
+													*qui replace item`zzz'= `nbm_`j'' if item``=`j'+`nbitems'''==`m'
+													*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+													local stop = 0
+												}
+											}
+										}
+									}
+								}
+							}
+						}
+						qui levelsof item`j'
+						local val = r(levels)
+						local checker: word 1 of `val'
+						local checker2: word 2 of `val'
+						local checker3: word 3 of `val'
+						local nummoda=r(r)
+						local nbmoda_`j'=`nummoda'-1	// FIX: highest category code = number of levels - 1, same convention as nbmoda (was the raw level count)
+						if (`nummoda'==2) {
+							qui recode item`j' (`checker'=0) (`checker2'=1)
+						}
+						if (`nummoda'==3) {
+							if (`checker'!=0) {
+								qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2)
+							}
+							else if (`checker2'!=1) {
+								qui recode item`j' (`checker2'=1) (`checker3'=2)
+							}
+							else if (`checker3'!=2) {
+								qui recode item`j' (`checker3'=2)
+							}
+						}
+					}
+					* valuesof is not a built-in command; its result is not used further in this section
+					qui valuesof comz
+					local val = r(values)
+					local checker: word 1 of `val'
+				}
+				else {
+					forvalues jj=1/`nbitems' {
+						local nbmoda_`jj'=`nbmoda'
+					}
+				}
+				* Run the DIF detection; r(difitems) is read below as: entries 1..nbitems = detected item numbers
+				* (missing when unused), entry nbitems+i = flag compared with 0 to decide whether item i gets constraints.
+				* ROSALI
+				qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt)
+				qui mat resmat=r(difitems)
+				local nbitems2 = 2*`nbitems'
+				* NOTE(review): nbdetect stays 0 if none of the first nbitems entries is missing; confirm this cannot happen
+				* Count the detected items: position of the first missing entry of resmat, minus one
+				local nbdetect = 0
+				local stop = 0
+				forvalues jj=1/`nbitems' {
+					if (`stop'==0) {
+						mat testm=J(1,1,.)
+						if (resmat[1,`jj']==testm[1,1]) {
+							local stop = 1
+							local nbdetect = `jj'-1
+						}
+					}
+				}
+				* Constraint u (and 100+u for 4-level items) ties the tt effects of a detected item across its categories
+				* Store the detected items
+				* when the flag in resmat[1,nbitems+i] is non-zero
+				* Define the constraints
+				local csrt=0
+				mat testm=J(1,1,0)
+				forvalues u=1/`nbdetect' {
+					local difitems`u'=resmat[1,`u']
+					local i=`difitems`u''
+					if (`nbmoda_`i''==3 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+						local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+						qui `constrnt`u''
+						local v=`u'+100
+						local constrnt`u'_2 = "constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))"
+						qui `constrnt`u'_2'
+					}
+					if (`nbmoda_`i''==2 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+						local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+						qui `constrnt`u''
+					}
+				}
+				* One equation per non-zero category z of each item with the loading fixed at z (THETA@z)
+				* Define the model
+				local mod "gsem "
+				local conformula = ""
+				forvalues i=1/`nbitems' {
+					local mod = "`mod'"+"(1.item`i'<-THETA@1)"
+					if (`nbmoda_`i''==3) {
+						local mod = "`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)"
+					}
+					else if (`nbmoda_`i''==2) {
+						local mod = "`mod'"+"(2.item`i'<-THETA@2)"
+					}
+				}
+				forvalues u=1/`nbdetect' {
+					local v=`difitems`u''
+					local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)"
+					if (`nbmoda_`v''==3) {
+						local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)"
+					}
+					else if (`nbmoda_`v''==2) {
+						local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)"
+					}
+					local w= 100+`u'
+					if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==3) {
+						local conformula = "`conformula'" + "`u' " + "`w' "
+					}
+					else if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==2) {
+						local conformula = "`conformula'" + "`u' "
+					}
+				}
+				if ("`conformula'" != "") {
+					local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')"
+				}
+				else {
+					local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent"
+				}
+				* Fit the model and keep the first two rows of r(table)
+				qui `mod'
+				mat V=r(table)
+				mat W=V[1..2,1...]
+ + * compilation + forvalues j=1/`nbitems' { + forvalues z=1/`nbmoda_`j'' { + mat outmat[`k',colnumb(outmat,"item`j'_`z'")] = W[1,colnumb(W,"`z'.item`j':_cons")] + } + } + * compilation DIF + forvalues u=1/`nbdetect' { + local j=`difitems`u'' + forvalues z=1/`nbmoda_`j'' { + mat outmat[`k',colnumb(outmat,"dif_`u'_`z'")] = W[1,colnumb(W,"`z'.item`j':tt")] + mat outmat[`k',colnumb(outmat,"dif_detect_`u'")] = `j' + } + } + + * Stocker les items de DIF originaux + if (`nbdif' > 0) { + qui levelsof dif1 + local ldif1 = r(levels) + local diff1: word 1 of `ldif1' + qui mat outmat[`k',colnumb(outmat,"real_dif_1")]=`diff1' + if (`nbdif' > 1) { + qui levelsof dif2 + local ldif2 = r(levels) + local diff2: word 1 of `ldif2' + qui mat outmat[`k',colnumb(outmat,"real_dif_2")]=`diff2' + if (`nbdif' > 2) { + qui levelsof dif3 + local ldif3 = r(levels) + local diff3: word 1 of `ldif3' + qui mat outmat[`k',colnumb(outmat,"real_dif_3")]=`diff3' + } + } + } + qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,colnumb(W,"THETA:tt")] + qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,colnumb(W,"THETA:tt")] + restore + } + putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace + putexcel A1=matrix(outmat), colnames +} +} +} diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S20.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S20.do new file mode 100644 index 0000000..82cdd40 --- /dev/null +++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S20.do @@ -0,0 +1,364 @@ +*================================================================================================================================================= +* Date : 2024-01-23 +* Stata version : Stata 18 SE +* +* This program analyses simulated data accounting for DIF through a partial credit model +* +* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea) +* +* 
+*================================================================================================================================================
+* Make the customised rosali ado-files visible to Stata.
+adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom"
+
+
+* Sample sizes to process and the scenario number handled by this file.
+local N = "50 100 200 300"
+local ss = "20"
+foreach s of local ss {
+	foreach Nnn of local N {
+		local Nn = `Nnn'
+		* Scenarios 1-4 are read from the NoDIF folder, all others from the DIF folder.
+		if (`s'>4) {
+			local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'"
+		}
+		else {
+			local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'"
+		}
+		local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'"
+		local scenarios = "A B C D E F G"
+		foreach scen of local scenarios {
+			clear
+			import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear
+			rename TT tt
+
+			* Design constants derived from the scenario number:
+			*   nbitems = 4 for scenarios 1-2 and 5-12, 7 otherwise
+			*   nbmoda  = 3 for even scenarios, 1 for odd ones
+			*   nbdif   = 0 (s<=4), 1 (s<=8), 2 (s<=16), 3 (s>16)
+			local nbitems = cond(`s'<=2 | (`s'>4 & `s'<=12), 4, 7)
+			local nbmoda = cond(mod(`s',2)==0, 3, 1)
+			local nbdif = cond(`s'<=4, 0, cond(`s'<=8, 1, cond(`s'<=16, 2, 3)))
+
+			* taillemat = at most J*M cells for the item parameters, J*M cells for the DIF
+			* parameters, J cells for the detected DIF items, nbdif cells for the true DIF
+			* items, plus 2 cells for beta and its standard error.
+			local taillemat = `nbitems'*(2*`nbmoda'+1)+`nbdif'+2
+
+			* Column names, in storage order: item/dif pairs, detections, true DIF, beta, se.
+			local colna ""
+			forvalues i=1/`nbitems' {
+				forvalues z=1/`nbmoda' {
+					local colna "`colna'item`i'_`z' dif_`i'_`z' "
+				}
+			}
+			forvalues i=1/`nbitems' {
+				local colna "`colna'dif_detect_`i' "
+			}
+			forvalues i=1/`nbdif' {
+				local colna "`colna'real_dif_`i' "
+			}
+			local colna "`colna'beta se_beta"
+
+
+			* One row per replication, initialised to missing.
+			mat outmat = J(1000,`taillemat',.)
+			* Replication loop, first part: name the result columns, isolate one replication,
+			* merge unobserved response categories (polytomous items at N=50 only), run the
+			* ROSALI DIF detection, then build and fit the gsem model. Leaves matrix W (the
+			* first two rows of r(table)) for the storage step that follows.
+			mat colnames outmat= `colna'
+			di "Scenario `s'`scen' / N=`Nnn'"
+			forvalues k=1/1000 {
+				if (mod(`k',100)==0) {
+					di "`k'/1000"
+				}
+				preserve
+				qui keep if replication==`k'
+
+
+				* Merge response categories that are not represented
+
+				if (`nbmoda'>1 & `Nn'==50) {
+					local com_z = 0
+					qui gen comz = 0
+					forvalues j = 1 / `nbitems' {
+						local recoda_`j' = 0
+						* Smallest and largest observed category of item j within each tt group.
+						qui tab item`j' if tt == 0, matrow(rect1_g0_`j') matcell(nbrt1_g0_`j')
+						local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1]
+						local minm`j'_t1_g0 = rect1_g0_`j'[1,1]
+
+						qui tab item`j' if tt == 1, matrow(rect1_g1_`j') matcell(nbrt1_g1_`j')
+						local minm`j'_t1_g1 = rect1_g1_`j'[1,1]
+						local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1]
+
+						local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1')
+						local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1')
+						local nbm_`j' = `=`maxm_`j''-`minm_`j'''
+
+						if `minm_`j'' != 0 & `com_z' == 0 {
+							local com_z = 1
+						}
+
+						* Flag the replication when category 3 is empty in at least one group.
+						qui count if item`j' == 3 & tt == 0
+						local mod3plac = r(N)
+						qui count if item`j' == 3 & tt == 1
+						local mod3tt = r(N)
+						local nb_rn3 = min(`mod3plac',`mod3tt')
+						if `nb_rn3'==0 {
+							qui replace comz = 1
+						}
+
+						* Scan categories 0..nbm_j-1; a category empty in at least one group is
+						* merged into the nearest category observed in either group.
+						forvalues m = 0/`=`nbm_`j''-1' {
+							qui count if item`j' == `m' & tt == 0
+							local nb_rn1_g0 = r(N)
+							qui count if item`j' == `m' & tt == 1
+							local nb_rn1_g1 = r(N)
+							local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1')
+							if `nb_rn' == 0 {
+								qui replace comz = 1
+								local recoda_`j' = 1
+								* Lowest category, or below a group's minimum: merge upwards.
+								if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' {
+									local stop = 1
+									forvalues kk = 1/`=`nbm_`j''-`m'' {
+										qui count if item`j' == `=`m' + `kk'' & tt == 0
+										local v`kk'1_0 = r(N)
+										qui count if item`j' == `=`m' + `kk'' & tt == 1
+										local v`kk'1_1 = r(N)
+										if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+											qui replace item`j'= `=`m'+`kk'' if item`j'==`m'
+											local zzz=`j'+`nbitems'
+											*qui replace item`zzz'=`=`m'+`kk'' if item``=`j'+`nbitems'''==`m'
+											*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+											local stop = 0
+										}
+									}
+								}
+								* Last scanned category, or at/above group 1's maximum: merge downwards.
+								else if `m' == `=`nbm_`j''-1' | `m' >= `maxm`j'_t1_g1' {
+									local stop = 1
+									forvalues kk = 1/`=`m'' {
+										qui count if item`j' == `=`m' - `kk'' & tt == 0
+										local v`kk'1_0 = r(N)
+										qui count if item`j' == `=`m' - `kk'' & tt == 1
+										local v`kk'1_1 = r(N)
+										if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+											qui replace item`j'= `=`m' - `kk'' if item`j'==`m'
+											local zzz=`j'+`nbitems'
+											*qui replace item`zzz'= `=`m' - `kk'' if item`zzz'==`m'
+											*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+											local stop = 0
+										}
+									}
+								}
+								* Interior category: the merge direction is drawn at random.
+								* NOTE(review): no `set seed` appears in this script, so these
+								* draws look non-reproducible across runs - confirm.
+								else {
+									if runiform()>0.5{
+										local stop = 1
+										forvalues kk = 1/`m' {
+											qui count if item`j' == `=`m' - `kk'' & tt == 0
+											local v`kk'1_0 = r(N)
+											qui count if item`j' == `=`m' - `kk'' & tt == 1
+											local v`kk'1_1 = r(N)
+											if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+												qui replace item`j'= `=`m'-`kk'' if item`j'==`m'
+												local zzz=`j'+`nbitems'
+												*qui replace item`zzz'=`=`m'-`kk'' if item``=`j'+`nbitems'''==`m'
+												*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+												local stop = 0
+											}
+										}
+									}
+									else {
+										local stop = 1
+										forvalues kk = 1/`=`nbm_`j''-`m'' {
+											qui count if item`j' == `=`m' + `kk'' & tt == 0
+											local v`kk'1_0 = r(N)
+											qui count if item`j' == `=`m' + `kk'' & tt == 1
+											local v`kk'1_1 = r(N)
+											if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0{
+												qui replace item`j'=`=`m' + `kk'' if item`j'==`m'
+												local zzz=`j'+`nbitems'
+												*qui replace item`zzz'=`=`m' + `kk'' if item``=`j'+`nbitems'''==`m'
+												*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+												local stop = 0
+											}
+											else {
+												* Candidate category empty and nothing merged yet:
+												* the responses are sent to nbm_j.
+												if `stop' != 0 {
+													qui replace item`j'= `nbm_`j'' if item`j'==`m'
+													local zzz=`j'+`nbitems'
+													*qui replace item`zzz'= `nbm_`j'' if item``=`j'+`nbitems'''==`m'
+													*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+													local stop = 0
+												}
+											}
+										}
+									}
+								}
+							}
+						}
+						* Recode the remaining categories to consecutive codes starting at 0.
+						qui levelsof item`j'
+						local val = r(levels)
+						local checker: word 1 of `val'
+						local checker2: word 2 of `val'
+						local checker3: word 3 of `val'
+						local nummoda=r(r)
+						* FIX: nbmoda_j must be the highest category code (number of levels
+						* minus one), as in the no-merge branch where it is 3 for items coded
+						* 0..3. Storing the number of levels made the model and the
+						* constraints refer to a category that does not exist after recoding.
+						local nbmoda_`j'=`nummoda'-1
+						if (`nummoda'==2) {
+							qui recode item`j' (`checker'=0) (`checker2'=1)
+						}
+						if (`nummoda'==3) {
+							if (`checker'!=0) {
+								qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2)
+							}
+							else if (`checker2'!=1) {
+								qui recode item`j' (`checker2'=1) (`checker3'=2)
+							}
+							else if (`checker3'!=2) {
+								qui recode item`j' (`checker3'=2)
+							}
+						}
+					}
+
+					qui valuesof comz
+					local val = r(values)
+					local checker: word 1 of `val'
+				}
+				else {
+					* No merging: every item keeps the scenario's highest category code.
+					forvalues jj=1/`nbitems' {
+						local nbmoda_`jj'=`nbmoda'
+					}
+				}
+
+
+				* ROSALI
+				qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt)
+				qui mat resmat=r(difitems)
+				local nbitems2 = 2*`nbitems'
+
+				* Count the detected items: index of the first missing entry of resmat, minus one.
+				* NOTE(review): if none of the first nbitems entries is missing, nbdetect
+				* stays 0 - confirm against the layout returned by rosali_original.
+				local nbdetect = 0
+				local stop = 0
+				forvalues jj=1/`nbitems' {
+					if (`stop'==0) {
+						mat testm=J(1,1,.)
+						if (resmat[1,`jj']==testm[1,1]) {
+							local stop = 1
+							local nbdetect = `jj'-1
+						}
+					}
+				}
+
+				* Store the detected items
+
+				* Constraint definitions: applied to detected item i when entry nbitems+i of
+				* resmat is non-zero. Constraint u ties the tt effect on category 2 to twice
+				* the one on category 1; constraint u+100 ties category 3 to three times it.
+				local csrt=0
+				mat testm=J(1,1,0)
+				forvalues u=1/`nbdetect' {
+					local difitems`u'=resmat[1,`u']
+					local i=`difitems`u''
+					if (`nbmoda_`i''==3 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+						local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+						qui `constrnt`u''
+						local v=`u'+100
+						local constrnt`u'_2 = "constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))"
+						qui `constrnt`u'_2'
+					}
+					if (`nbmoda_`i''==2 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+						local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+						qui `constrnt`u''
+					}
+				}
+
+				* Model definition: one equation per non-zero category of each item, with the
+				* loading on THETA fixed to the category code.
+				local mod "gsem "
+				local conformula = ""
+				forvalues i=1/`nbitems' {
+					local mod = "`mod'"+"(1.item`i'<-THETA@1)"
+					if (`nbmoda_`i''==3) {
+						local mod = "`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)"
+					}
+					else if (`nbmoda_`i''==2) {
+						local mod = "`mod'"+"(2.item`i'<-THETA@2)"
+					}
+				}
+				* Detected items additionally receive tt as a covariate; the numbers of the
+				* constraints defined above are collected in conformula.
+				forvalues u=1/`nbdetect' {
+					local v=`difitems`u''
+					local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)"
+					if (`nbmoda_`v''==3) {
+						local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)"
+					}
+					else if (`nbmoda_`v''==2) {
+						local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)"
+					}
+					local w= 100+`u'
+					if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==3) {
+						local conformula = "`conformula'" + "`u' " + "`w' "
+					}
+					else if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==2) {
+						local conformula = "`conformula'" + "`u' "
+					}
+				}
+				if ("`conformula'" != "") {
+					local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')"
+				}
+				else {
+					local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent"
+				}
+				* Fit the model and keep the first two rows of r(table).
+				qui `mod'
+				mat V=r(table)
+				mat W=V[1..2,1...]
+
+				* Copy the item intercepts from row 1 of W into row k of outmat.
+				forvalues j=1/`nbitems' {
+					forvalues z=1/`nbmoda_`j'' {
+						local src = colnumb(W,"`z'.item`j':_cons")
+						local dst = colnumb(outmat,"item`j'_`z'")
+						mat outmat[`k',`dst'] = W[1,`src']
+					}
+				}
+				* Copy the tt coefficients of each detected item and record which item it was.
+				forvalues u=1/`nbdetect' {
+					local ditem=`difitems`u''
+					local flagcol = colnumb(outmat,"dif_detect_`u'")
+					forvalues z=1/`nbmoda_`ditem'' {
+						local src = colnumb(W,"`z'.item`ditem':tt")
+						local dst = colnumb(outmat,"dif_`u'_`z'")
+						mat outmat[`k',`dst'] = W[1,`src']
+						mat outmat[`k',`flagcol'] = `ditem'
+					}
+				}
+
+				* Store the original DIF items: first level of dif1..dif3, as many as nbdif.
+				forvalues d=1/`=min(`nbdif',3)' {
+					qui levelsof dif`d'
+					local truth : word 1 of `r(levels)'
+					qui mat outmat[`k',colnumb(outmat,"real_dif_`d'")]=`truth'
+				}
+				* Coefficient of tt on THETA (row 1 of W) and its row-2 counterpart.
+				local thcol = colnumb(W,"THETA:tt")
+				qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,`thcol']
+				qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,`thcol']
+				restore
+			}
+			* Export the matrix of all replications for this scenario and sample size.
+			putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace
+			putexcel A1=matrix(outmat), colnames
+		}
+	}
+}
diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S3.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S3.do
new file mode 100644
index 0000000..6b353a7
--- /dev/null
+++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S3.do
@@ -0,0 +1,364 @@
+*=================================================================================================================================================
+* Date : 2024-01-23
+* Stata version : Stata 18 SE
+*
+* This program analyses simulated data accounting for DIF through a partial credit model
+*
+* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea)
+*
+*
+*================================================================================================================================================
+* Make the customised rosali ado-files visible to Stata.
+adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom"
+
+
+* Sample sizes to process and the scenario number handled by this file.
+local N = "50 100 200 300"
+local ss = "3"
+foreach s of local ss {
+	foreach Nnn of local N {
+		local Nn = `Nnn'
+		* Scenarios 1-4 are read from the NoDIF folder, all others from the DIF folder.
+		if (`s'>4) {
+			local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'"
+		}
+		else {
+			local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'"
+		}
+		local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'"
+		local scenarios = "A B C D E F G"
+		foreach scen of local scenarios {
+			clear
+			import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear
+			rename TT tt
+
+			* Design constants derived from the scenario number:
+			*   nbitems = 4 for scenarios 1-2 and 5-12, 7 otherwise
+			*   nbmoda  = 3 for even scenarios, 1 for odd ones
+			*   nbdif   = 0 (s<=4), 1 (s<=8), 2 (s<=16), 3 (s>16)
+			local nbitems = cond(`s'<=2 | (`s'>4 & `s'<=12), 4, 7)
+			local nbmoda = cond(mod(`s',2)==0, 3, 1)
+			local nbdif = cond(`s'<=4, 0, cond(`s'<=8, 1, cond(`s'<=16, 2, 3)))
+
+			* taillemat = at most J*M cells for the item parameters, J*M cells for the DIF
+			* parameters, J cells for the detected DIF items, nbdif cells for the true DIF
+			* items, plus 2 cells for beta and its standard error.
+			local taillemat = `nbitems'*(2*`nbmoda'+1)+`nbdif'+2
+
+			* Column names, in storage order: item/dif pairs, detections, true DIF, beta, se.
+			local colna ""
+			forvalues i=1/`nbitems' {
+				forvalues z=1/`nbmoda' {
+					local colna "`colna'item`i'_`z' dif_`i'_`z' "
+				}
+			}
+			forvalues i=1/`nbitems' {
+				local colna "`colna'dif_detect_`i' "
+			}
+			forvalues i=1/`nbdif' {
+				local colna "`colna'real_dif_`i' "
+			}
+			local colna "`colna'beta se_beta"
+
+
+			* One row per replication, initialised to missing.
+			mat outmat = J(1000,`taillemat',.)
+			* Replication loop, first part: name the result columns, isolate one replication,
+			* merge unobserved response categories (polytomous items at N=50 only), run the
+			* ROSALI DIF detection, then build and fit the gsem model. Leaves matrix W (the
+			* first two rows of r(table)) for the storage step that follows.
+			mat colnames outmat= `colna'
+			di "Scenario `s'`scen' / N=`Nnn'"
+			forvalues k=1/1000 {
+				if (mod(`k',100)==0) {
+					di "`k'/1000"
+				}
+				preserve
+				qui keep if replication==`k'
+
+
+				* Merge response categories that are not represented
+
+				if (`nbmoda'>1 & `Nn'==50) {
+					local com_z = 0
+					qui gen comz = 0
+					forvalues j = 1 / `nbitems' {
+						local recoda_`j' = 0
+						* Smallest and largest observed category of item j within each tt group.
+						qui tab item`j' if tt == 0, matrow(rect1_g0_`j') matcell(nbrt1_g0_`j')
+						local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1]
+						local minm`j'_t1_g0 = rect1_g0_`j'[1,1]
+
+						qui tab item`j' if tt == 1, matrow(rect1_g1_`j') matcell(nbrt1_g1_`j')
+						local minm`j'_t1_g1 = rect1_g1_`j'[1,1]
+						local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1]
+
+						local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1')
+						local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1')
+						local nbm_`j' = `=`maxm_`j''-`minm_`j'''
+
+						if `minm_`j'' != 0 & `com_z' == 0 {
+							local com_z = 1
+						}
+
+						* Flag the replication when category 3 is empty in at least one group.
+						qui count if item`j' == 3 & tt == 0
+						local mod3plac = r(N)
+						qui count if item`j' == 3 & tt == 1
+						local mod3tt = r(N)
+						local nb_rn3 = min(`mod3plac',`mod3tt')
+						if `nb_rn3'==0 {
+							qui replace comz = 1
+						}
+
+						* Scan categories 0..nbm_j-1; a category empty in at least one group is
+						* merged into the nearest category observed in either group.
+						forvalues m = 0/`=`nbm_`j''-1' {
+							qui count if item`j' == `m' & tt == 0
+							local nb_rn1_g0 = r(N)
+							qui count if item`j' == `m' & tt == 1
+							local nb_rn1_g1 = r(N)
+							local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1')
+							if `nb_rn' == 0 {
+								qui replace comz = 1
+								local recoda_`j' = 1
+								* Lowest category, or below a group's minimum: merge upwards.
+								if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' {
+									local stop = 1
+									forvalues kk = 1/`=`nbm_`j''-`m'' {
+										qui count if item`j' == `=`m' + `kk'' & tt == 0
+										local v`kk'1_0 = r(N)
+										qui count if item`j' == `=`m' + `kk'' & tt == 1
+										local v`kk'1_1 = r(N)
+										if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+											qui replace item`j'= `=`m'+`kk'' if item`j'==`m'
+											local zzz=`j'+`nbitems'
+											*qui replace item`zzz'=`=`m'+`kk'' if item``=`j'+`nbitems'''==`m'
+											*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+											local stop = 0
+										}
+									}
+								}
+								* Last scanned category, or at/above group 1's maximum: merge downwards.
+								else if `m' == `=`nbm_`j''-1' | `m' >= `maxm`j'_t1_g1' {
+									local stop = 1
+									forvalues kk = 1/`=`m'' {
+										qui count if item`j' == `=`m' - `kk'' & tt == 0
+										local v`kk'1_0 = r(N)
+										qui count if item`j' == `=`m' - `kk'' & tt == 1
+										local v`kk'1_1 = r(N)
+										if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+											qui replace item`j'= `=`m' - `kk'' if item`j'==`m'
+											local zzz=`j'+`nbitems'
+											*qui replace item`zzz'= `=`m' - `kk'' if item`zzz'==`m'
+											*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+											local stop = 0
+										}
+									}
+								}
+								* Interior category: the merge direction is drawn at random.
+								* NOTE(review): no `set seed` appears in this script, so these
+								* draws look non-reproducible across runs - confirm.
+								else {
+									if runiform()>0.5{
+										local stop = 1
+										forvalues kk = 1/`m' {
+											qui count if item`j' == `=`m' - `kk'' & tt == 0
+											local v`kk'1_0 = r(N)
+											qui count if item`j' == `=`m' - `kk'' & tt == 1
+											local v`kk'1_1 = r(N)
+											if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+												qui replace item`j'= `=`m'-`kk'' if item`j'==`m'
+												local zzz=`j'+`nbitems'
+												*qui replace item`zzz'=`=`m'-`kk'' if item``=`j'+`nbitems'''==`m'
+												*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+												local stop = 0
+											}
+										}
+									}
+									else {
+										local stop = 1
+										forvalues kk = 1/`=`nbm_`j''-`m'' {
+											qui count if item`j' == `=`m' + `kk'' & tt == 0
+											local v`kk'1_0 = r(N)
+											qui count if item`j' == `=`m' + `kk'' & tt == 1
+											local v`kk'1_1 = r(N)
+											if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0{
+												qui replace item`j'=`=`m' + `kk'' if item`j'==`m'
+												local zzz=`j'+`nbitems'
+												*qui replace item`zzz'=`=`m' + `kk'' if item``=`j'+`nbitems'''==`m'
+												*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+												local stop = 0
+											}
+											else {
+												* Candidate category empty and nothing merged yet:
+												* the responses are sent to nbm_j.
+												if `stop' != 0 {
+													qui replace item`j'= `nbm_`j'' if item`j'==`m'
+													local zzz=`j'+`nbitems'
+													*qui replace item`zzz'= `nbm_`j'' if item``=`j'+`nbitems'''==`m'
+													*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+													local stop = 0
+												}
+											}
+										}
+									}
+								}
+							}
+						}
+						* Recode the remaining categories to consecutive codes starting at 0.
+						qui levelsof item`j'
+						local val = r(levels)
+						local checker: word 1 of `val'
+						local checker2: word 2 of `val'
+						local checker3: word 3 of `val'
+						local nummoda=r(r)
+						* FIX: nbmoda_j must be the highest category code (number of levels
+						* minus one), as in the no-merge branch where it is 3 for items coded
+						* 0..3. Storing the number of levels made the model and the
+						* constraints refer to a category that does not exist after recoding.
+						local nbmoda_`j'=`nummoda'-1
+						if (`nummoda'==2) {
+							qui recode item`j' (`checker'=0) (`checker2'=1)
+						}
+						if (`nummoda'==3) {
+							if (`checker'!=0) {
+								qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2)
+							}
+							else if (`checker2'!=1) {
+								qui recode item`j' (`checker2'=1) (`checker3'=2)
+							}
+							else if (`checker3'!=2) {
+								qui recode item`j' (`checker3'=2)
+							}
+						}
+					}
+
+					qui valuesof comz
+					local val = r(values)
+					local checker: word 1 of `val'
+				}
+				else {
+					* No merging: every item keeps the scenario's highest category code.
+					forvalues jj=1/`nbitems' {
+						local nbmoda_`jj'=`nbmoda'
+					}
+				}
+
+
+				* ROSALI
+				qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt)
+				qui mat resmat=r(difitems)
+				local nbitems2 = 2*`nbitems'
+
+				* Count the detected items: index of the first missing entry of resmat, minus one.
+				* NOTE(review): if none of the first nbitems entries is missing, nbdetect
+				* stays 0 - confirm against the layout returned by rosali_original.
+				local nbdetect = 0
+				local stop = 0
+				forvalues jj=1/`nbitems' {
+					if (`stop'==0) {
+						mat testm=J(1,1,.)
+						if (resmat[1,`jj']==testm[1,1]) {
+							local stop = 1
+							local nbdetect = `jj'-1
+						}
+					}
+				}
+
+				* Store the detected items
+
+				* Constraint definitions: applied to detected item i when entry nbitems+i of
+				* resmat is non-zero. Constraint u ties the tt effect on category 2 to twice
+				* the one on category 1; constraint u+100 ties category 3 to three times it.
+				local csrt=0
+				mat testm=J(1,1,0)
+				forvalues u=1/`nbdetect' {
+					local difitems`u'=resmat[1,`u']
+					local i=`difitems`u''
+					if (`nbmoda_`i''==3 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+						local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+						qui `constrnt`u''
+						local v=`u'+100
+						local constrnt`u'_2 = "constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))"
+						qui `constrnt`u'_2'
+					}
+					if (`nbmoda_`i''==2 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+						local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+						qui `constrnt`u''
+					}
+				}
+
+				* Model definition: one equation per non-zero category of each item, with the
+				* loading on THETA fixed to the category code.
+				local mod "gsem "
+				local conformula = ""
+				forvalues i=1/`nbitems' {
+					local mod = "`mod'"+"(1.item`i'<-THETA@1)"
+					if (`nbmoda_`i''==3) {
+						local mod = "`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)"
+					}
+					else if (`nbmoda_`i''==2) {
+						local mod = "`mod'"+"(2.item`i'<-THETA@2)"
+					}
+				}
+				* Detected items additionally receive tt as a covariate; the numbers of the
+				* constraints defined above are collected in conformula.
+				forvalues u=1/`nbdetect' {
+					local v=`difitems`u''
+					local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)"
+					if (`nbmoda_`v''==3) {
+						local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)"
+					}
+					else if (`nbmoda_`v''==2) {
+						local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)"
+					}
+					local w= 100+`u'
+					if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==3) {
+						local conformula = "`conformula'" + "`u' " + "`w' "
+					}
+					else if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==2) {
+						local conformula = "`conformula'" + "`u' "
+					}
+				}
+				if ("`conformula'" != "") {
+					local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')"
+				}
+				else {
+					local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent"
+				}
+				* Fit the model and keep the first two rows of r(table).
+				qui `mod'
+				mat V=r(table)
+				mat W=V[1..2,1...]
+
+				* Copy the item intercepts from row 1 of W into row k of outmat.
+				forvalues j=1/`nbitems' {
+					forvalues z=1/`nbmoda_`j'' {
+						local src = colnumb(W,"`z'.item`j':_cons")
+						local dst = colnumb(outmat,"item`j'_`z'")
+						mat outmat[`k',`dst'] = W[1,`src']
+					}
+				}
+				* Copy the tt coefficients of each detected item and record which item it was.
+				forvalues u=1/`nbdetect' {
+					local ditem=`difitems`u''
+					local flagcol = colnumb(outmat,"dif_detect_`u'")
+					forvalues z=1/`nbmoda_`ditem'' {
+						local src = colnumb(W,"`z'.item`ditem':tt")
+						local dst = colnumb(outmat,"dif_`u'_`z'")
+						mat outmat[`k',`dst'] = W[1,`src']
+						mat outmat[`k',`flagcol'] = `ditem'
+					}
+				}
+
+				* Store the original DIF items: first level of dif1..dif3, as many as nbdif.
+				forvalues d=1/`=min(`nbdif',3)' {
+					qui levelsof dif`d'
+					local truth : word 1 of `r(levels)'
+					qui mat outmat[`k',colnumb(outmat,"real_dif_`d'")]=`truth'
+				}
+				* Coefficient of tt on THETA (row 1 of W) and its row-2 counterpart.
+				local thcol = colnumb(W,"THETA:tt")
+				qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,`thcol']
+				qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,`thcol']
+				restore
+			}
+			* Export the matrix of all replications for this scenario and sample size.
+			putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace
+			putexcel A1=matrix(outmat), colnames
+		}
+	}
+}
diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S4.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S4.do
new file mode 100644
index 0000000..f00f747
--- /dev/null
+++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S4.do
@@ -0,0 +1,364 @@
+*=================================================================================================================================================
+* Date : 2024-01-23
+* Stata version : Stata 18 SE
+*
+* This program analyses simulated data accounting for DIF through a partial credit model
+*
+* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea)
+*
+*
+*================================================================================================================================================
+* Make the customised rosali ado-files visible to Stata.
+adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom"
+
+
+* Sample sizes to process and the scenario number handled by this file.
+local N = "50 100 200 300"
+local ss = "4"
+foreach s of local ss {
+	foreach Nnn of local N {
+		local Nn = `Nnn'
+		* Scenarios 1-4 are read from the NoDIF folder, all others from the DIF folder.
+		if (`s'>4) {
+			local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'"
+		}
+		else {
+			local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'"
+		}
+		local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'"
+		local scenarios = "A B C D E F G"
+		foreach scen of local scenarios {
+			clear
+			import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear
+			rename TT tt
+
+			* Design constants derived from the scenario number:
+			*   nbitems = 4 for scenarios 1-2 and 5-12, 7 otherwise
+			*   nbmoda  = 3 for even scenarios, 1 for odd ones
+			*   nbdif   = 0 (s<=4), 1 (s<=8), 2 (s<=16), 3 (s>16)
+			local nbitems = cond(`s'<=2 | (`s'>4 & `s'<=12), 4, 7)
+			local nbmoda = cond(mod(`s',2)==0, 3, 1)
+			local nbdif = cond(`s'<=4, 0, cond(`s'<=8, 1, cond(`s'<=16, 2, 3)))
+
+			* taillemat = at most J*M cells for the item parameters, J*M cells for the DIF
+			* parameters, J cells for the detected DIF items, nbdif cells for the true DIF
+			* items, plus 2 cells for beta and its standard error.
+			local taillemat = `nbitems'*(2*`nbmoda'+1)+`nbdif'+2
+
+			* Column names, in storage order: item/dif pairs, detections, true DIF, beta, se.
+			local colna ""
+			forvalues i=1/`nbitems' {
+				forvalues z=1/`nbmoda' {
+					local colna "`colna'item`i'_`z' dif_`i'_`z' "
+				}
+			}
+			forvalues i=1/`nbitems' {
+				local colna "`colna'dif_detect_`i' "
+			}
+			forvalues i=1/`nbdif' {
+				local colna "`colna'real_dif_`i' "
+			}
+			local colna "`colna'beta se_beta"
+
+
+			* One row per replication, initialised to missing.
+			mat outmat = J(1000,`taillemat',.)
+			* Replication loop, first part: name the result columns, isolate one replication,
+			* merge unobserved response categories (polytomous items at N=50 only), run the
+			* ROSALI DIF detection, then build and fit the gsem model. Leaves matrix W (the
+			* first two rows of r(table)) for the storage step that follows.
+			mat colnames outmat= `colna'
+			di "Scenario `s'`scen' / N=`Nnn'"
+			forvalues k=1/1000 {
+				if (mod(`k',100)==0) {
+					di "`k'/1000"
+				}
+				preserve
+				qui keep if replication==`k'
+
+
+				* Merge response categories that are not represented
+
+				if (`nbmoda'>1 & `Nn'==50) {
+					local com_z = 0
+					qui gen comz = 0
+					forvalues j = 1 / `nbitems' {
+						local recoda_`j' = 0
+						* Smallest and largest observed category of item j within each tt group.
+						qui tab item`j' if tt == 0, matrow(rect1_g0_`j') matcell(nbrt1_g0_`j')
+						local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1]
+						local minm`j'_t1_g0 = rect1_g0_`j'[1,1]
+
+						qui tab item`j' if tt == 1, matrow(rect1_g1_`j') matcell(nbrt1_g1_`j')
+						local minm`j'_t1_g1 = rect1_g1_`j'[1,1]
+						local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1]
+
+						local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1')
+						local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1')
+						local nbm_`j' = `=`maxm_`j''-`minm_`j'''
+
+						if `minm_`j'' != 0 & `com_z' == 0 {
+							local com_z = 1
+						}
+
+						* Flag the replication when category 3 is empty in at least one group.
+						qui count if item`j' == 3 & tt == 0
+						local mod3plac = r(N)
+						qui count if item`j' == 3 & tt == 1
+						local mod3tt = r(N)
+						local nb_rn3 = min(`mod3plac',`mod3tt')
+						if `nb_rn3'==0 {
+							qui replace comz = 1
+						}
+
+						* Scan categories 0..nbm_j-1; a category empty in at least one group is
+						* merged into the nearest category observed in either group.
+						forvalues m = 0/`=`nbm_`j''-1' {
+							qui count if item`j' == `m' & tt == 0
+							local nb_rn1_g0 = r(N)
+							qui count if item`j' == `m' & tt == 1
+							local nb_rn1_g1 = r(N)
+							local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1')
+							if `nb_rn' == 0 {
+								qui replace comz = 1
+								local recoda_`j' = 1
+								* Lowest category, or below a group's minimum: merge upwards.
+								if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' {
+									local stop = 1
+									forvalues kk = 1/`=`nbm_`j''-`m'' {
+										qui count if item`j' == `=`m' + `kk'' & tt == 0
+										local v`kk'1_0 = r(N)
+										qui count if item`j' == `=`m' + `kk'' & tt == 1
+										local v`kk'1_1 = r(N)
+										if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+											qui replace item`j'= `=`m'+`kk'' if item`j'==`m'
+											local zzz=`j'+`nbitems'
+											*qui replace item`zzz'=`=`m'+`kk'' if item``=`j'+`nbitems'''==`m'
+											*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+											local stop = 0
+										}
+									}
+								}
+								* Last scanned category, or at/above group 1's maximum: merge downwards.
+								else if `m' == `=`nbm_`j''-1' | `m' >= `maxm`j'_t1_g1' {
+									local stop = 1
+									forvalues kk = 1/`=`m'' {
+										qui count if item`j' == `=`m' - `kk'' & tt == 0
+										local v`kk'1_0 = r(N)
+										qui count if item`j' == `=`m' - `kk'' & tt == 1
+										local v`kk'1_1 = r(N)
+										if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+											qui replace item`j'= `=`m' - `kk'' if item`j'==`m'
+											local zzz=`j'+`nbitems'
+											*qui replace item`zzz'= `=`m' - `kk'' if item`zzz'==`m'
+											*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+											local stop = 0
+										}
+									}
+								}
+								* Interior category: the merge direction is drawn at random.
+								* NOTE(review): no `set seed` appears in this script, so these
+								* draws look non-reproducible across runs - confirm.
+								else {
+									if runiform()>0.5{
+										local stop = 1
+										forvalues kk = 1/`m' {
+											qui count if item`j' == `=`m' - `kk'' & tt == 0
+											local v`kk'1_0 = r(N)
+											qui count if item`j' == `=`m' - `kk'' & tt == 1
+											local v`kk'1_1 = r(N)
+											if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+												qui replace item`j'= `=`m'-`kk'' if item`j'==`m'
+												local zzz=`j'+`nbitems'
+												*qui replace item`zzz'=`=`m'-`kk'' if item``=`j'+`nbitems'''==`m'
+												*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+												local stop = 0
+											}
+										}
+									}
+									else {
+										local stop = 1
+										forvalues kk = 1/`=`nbm_`j''-`m'' {
+											qui count if item`j' == `=`m' + `kk'' & tt == 0
+											local v`kk'1_0 = r(N)
+											qui count if item`j' == `=`m' + `kk'' & tt == 1
+											local v`kk'1_1 = r(N)
+											if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0{
+												qui replace item`j'=`=`m' + `kk'' if item`j'==`m'
+												local zzz=`j'+`nbitems'
+												*qui replace item`zzz'=`=`m' + `kk'' if item``=`j'+`nbitems'''==`m'
+												*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+												local stop = 0
+											}
+											else {
+												* Candidate category empty and nothing merged yet:
+												* the responses are sent to nbm_j.
+												if `stop' != 0 {
+													qui replace item`j'= `nbm_`j'' if item`j'==`m'
+													local zzz=`j'+`nbitems'
+													*qui replace item`zzz'= `nbm_`j'' if item``=`j'+`nbitems'''==`m'
+													*di "WARNING SCENARIO `k': items `j': answers `m' and `=`m'+`kk'' merged"
+													local stop = 0
+												}
+											}
+										}
+									}
+								}
+							}
+						}
+						* Recode the remaining categories to consecutive codes starting at 0.
+						qui levelsof item`j'
+						local val = r(levels)
+						local checker: word 1 of `val'
+						local checker2: word 2 of `val'
+						local checker3: word 3 of `val'
+						local nummoda=r(r)
+						* FIX: nbmoda_j must be the highest category code (number of levels
+						* minus one), as in the no-merge branch where it is 3 for items coded
+						* 0..3. Storing the number of levels made the model and the
+						* constraints refer to a category that does not exist after recoding.
+						local nbmoda_`j'=`nummoda'-1
+						if (`nummoda'==2) {
+							qui recode item`j' (`checker'=0) (`checker2'=1)
+						}
+						if (`nummoda'==3) {
+							if (`checker'!=0) {
+								qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2)
+							}
+							else if (`checker2'!=1) {
+								qui recode item`j' (`checker2'=1) (`checker3'=2)
+							}
+							else if (`checker3'!=2) {
+								qui recode item`j' (`checker3'=2)
+							}
+						}
+					}
+
+					qui valuesof comz
+					local val = r(values)
+					local checker: word 1 of `val'
+				}
+				else {
+					* No merging: every item keeps the scenario's highest category code.
+					forvalues jj=1/`nbitems' {
+						local nbmoda_`jj'=`nbmoda'
+					}
+				}
+
+
+				* ROSALI
+				qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt)
+				qui mat resmat=r(difitems)
+				local nbitems2 = 2*`nbitems'
+
+				* Count the detected items: index of the first missing entry of resmat, minus one.
+				* NOTE(review): if none of the first nbitems entries is missing, nbdetect
+				* stays 0 - confirm against the layout returned by rosali_original.
+				local nbdetect = 0
+				local stop = 0
+				forvalues jj=1/`nbitems' {
+					if (`stop'==0) {
+						mat testm=J(1,1,.)
+						if (resmat[1,`jj']==testm[1,1]) {
+							local stop = 1
+							local nbdetect = `jj'-1
+						}
+					}
+				}
+
+				* Store the detected items
+
+				* Constraint definitions: applied to detected item i when entry nbitems+i of
+				* resmat is non-zero. Constraint u ties the tt effect on category 2 to twice
+				* the one on category 1; constraint u+100 ties category 3 to three times it.
+				local csrt=0
+				mat testm=J(1,1,0)
+				forvalues u=1/`nbdetect' {
+					local difitems`u'=resmat[1,`u']
+					local i=`difitems`u''
+					if (`nbmoda_`i''==3 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+						local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+						qui `constrnt`u''
+						local v=`u'+100
+						local constrnt`u'_2 = "constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))"
+						qui `constrnt`u'_2'
+					}
+					if (`nbmoda_`i''==2 & resmat[1,`nbitems'+`i']!=testm[1,1]){
+						local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+						qui `constrnt`u''
+					}
+				}
+
+				* Model definition: one equation per non-zero category of each item, with the
+				* loading on THETA fixed to the category code.
+				local mod "gsem "
+				local conformula = ""
+				forvalues i=1/`nbitems' {
+					local mod = "`mod'"+"(1.item`i'<-THETA@1)"
+					if (`nbmoda_`i''==3) {
+						local mod = "`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)"
+					}
+					else if (`nbmoda_`i''==2) {
+						local mod = "`mod'"+"(2.item`i'<-THETA@2)"
+					}
+				}
+				* Detected items additionally receive tt as a covariate; the numbers of the
+				* constraints defined above are collected in conformula.
+				forvalues u=1/`nbdetect' {
+					local v=`difitems`u''
+					local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)"
+					if (`nbmoda_`v''==3) {
+						local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)"
+					}
+					else if (`nbmoda_`v''==2) {
+						local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)"
+					}
+					local w= 100+`u'
+					if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==3) {
+						local conformula = "`conformula'" + "`u' " + "`w' "
+					}
+					else if (resmat[1,`nbitems'+`v']!=testm[1,1] & `nbmoda_`v''==2) {
+						local conformula = "`conformula'" + "`u' "
+					}
+				}
+				if ("`conformula'" != "") {
+					local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')"
+				}
+				else {
+					local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent"
+				}
+				* Fit the model and keep the first two rows of r(table).
+				qui `mod'
+				mat V=r(table)
+				mat W=V[1..2,1...]
+ + * compilation + forvalues j=1/`nbitems' { + forvalues z=1/`nbmoda_`j'' { + mat outmat[`k',colnumb(outmat,"item`j'_`z'")] = W[1,colnumb(W,"`z'.item`j':_cons")] + } + } + * compilation DIF + forvalues u=1/`nbdetect' { + local j=`difitems`u'' + forvalues z=1/`nbmoda_`j'' { + mat outmat[`k',colnumb(outmat,"dif_`u'_`z'")] = W[1,colnumb(W,"`z'.item`j':tt")] + mat outmat[`k',colnumb(outmat,"dif_detect_`u'")] = `j' + } + } + + * Stocker les items de DIF originaux + if (`nbdif' > 0) { + qui levelsof dif1 + local ldif1 = r(levels) + local diff1: word 1 of `ldif1' + qui mat outmat[`k',colnumb(outmat,"real_dif_1")]=`diff1' + if (`nbdif' > 1) { + qui levelsof dif2 + local ldif2 = r(levels) + local diff2: word 1 of `ldif2' + qui mat outmat[`k',colnumb(outmat,"real_dif_2")]=`diff2' + if (`nbdif' > 2) { + qui levelsof dif3 + local ldif3 = r(levels) + local diff3: word 1 of `ldif3' + qui mat outmat[`k',colnumb(outmat,"real_dif_3")]=`diff3' + } + } + } + qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,colnumb(W,"THETA:tt")] + qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,colnumb(W,"THETA:tt")] + restore + } + putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace + putexcel A1=matrix(outmat), colnames +} +} +} diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S5.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S5.do new file mode 100644 index 0000000..7223c34 --- /dev/null +++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S5.do @@ -0,0 +1,364 @@ +*================================================================================================================================================= +* Date : 2024-01-23 +* Stata version : Stata 18 SE +* +* This program analyses simulated data accounting for DIF through a partial credit model +* +* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea) +* +* 
+*================================================================================================================================================
+adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom"
+
+* Scenario driver. For every sample size and sub-scenario (A to G) this script loads the
+* simulated replications, runs ROSALI DIF detection on each of the 1000 replications, refits
+* a partial credit model with gsem (group effect tt on the flagged items), and exports the
+* estimates to one Excel file per sub-scenario.
+
+local N = "50 100 200 300"
+local ss = "5"
+foreach s in `ss' {
+    foreach Nnn in `N' {
+        local Nn = `Nnn'
+        * Scenarios 1 to 4 are read from the NoDIF folder, all others from the DIF folder
+        local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'"
+        if (`s'<=4) {
+            local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'"
+        }
+        local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'"
+        local scenarios = "A B C D E F G"
+        foreach scen in `scenarios' {
+            import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear
+            rename TT tt
+
+            * Number of items per scenario
+            if (`s'<=2) {
+                local nbitems=4
+            }
+            else if (`s'<=4) {
+                local nbitems=7
+            }
+            else if (`s'<=12) {
+                local nbitems=4
+            }
+            else {
+                local nbitems=7
+            }
+
+            * Number of non-zero response categories: 3 for even scenarios, 1 for odd ones
+            if (mod(`s',2)==0) {
+                local nbmoda=3
+            }
+            else {
+                local nbmoda=1
+            }
+
+            * Number of items simulated with DIF
+            if (`s'<=4) {
+                local nbdif=0
+            }
+            else if (`s'<=8) {
+                local nbdif=1
+            }
+            else if (`s'<=16) {
+                local nbdif=2
+            }
+            else {
+                local nbdif=3
+            }
+
+            * taillemat = J*M cells for the item parameters + J*M cells for the DIF parameters
+            *           + J cells for the detected DIF items + nbdif cells for the true DIF items
+            *           + 2 cells for the group effect (beta) and its standard error
+            local taillemat=2*`nbitems'*`nbmoda'+`nbitems'+`nbdif'+2
+            local colna=""
+            forvalues i=1/`nbitems' {
+                forvalues z=1/`nbmoda' {
+                    local colna = "`colna'"+"item`i'_`z' "
+                    local colna = "`colna'"+"dif_`i'_`z' "
+                }
+            }
+            forvalues i=1/`nbitems' {
+                local colna = "`colna'"+"dif_detect_`i' "
+            }
+            forvalues i=1/`nbdif' {
+                local colna = "`colna'"+"real_dif_`i' "
+            }
+            local colna = "`colna'" + "beta " + "se_beta"
+
+            * One row per replication
+            mat outmat = J(1000,`taillemat',.)
+            mat colnames outmat= `colna'
+            di "Scenario `s'`scen' / N=`Nnn'"
+            forvalues k=1/1000 {
+                if (mod(`k',100)==0) {
+                    di "`k'/1000"
+                }
+                preserve
+                qui keep if replication==`k'
+
+                * Merge response categories that are not observed in both groups.
+                * Only done for polytomous items at N=50.
+                if (`nbmoda'>1 & `Nn'==50) {
+                    forvalues j = 1 / `nbitems' {
+                        * Lowest and highest observed category of item j in each group
+                        qui tab item`j' if tt == 0, matrow(rect1_g0_`j') matcell(nbrt1_g0_`j')
+                        local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1]
+                        local minm`j'_t1_g0 = rect1_g0_`j'[1,1]
+
+                        qui tab item`j' if tt == 1, matrow(rect1_g1_`j') matcell(nbrt1_g1_`j')
+                        local minm`j'_t1_g1 = rect1_g1_`j'[1,1]
+                        local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1]
+
+                        local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1')
+                        local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1')
+                        local nbm_`j' = `=`maxm_`j''-`minm_`j'''
+
+                        forvalues m = 0/`=`nbm_`j''-1' {
+                            qui count if item`j' == `m' & tt == 0
+                            local nb_rn1_g0 = r(N)
+                            qui count if item`j' == `m' & tt == 1
+                            local nb_rn1_g1 = r(N)
+                            local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1')
+                            * Category m is empty in at least one group: merge it with a neighbour
+                            if `nb_rn' == 0 {
+                                if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' {
+                                    * Bottom of the scale: merge into the nearest non-empty higher category
+                                    local stop = 1
+                                    forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                        qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                        local n_g0 = r(N)
+                                        qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                        local n_g1 = r(N)
+                                        if (`n_g0' != 0 | `n_g1' != 0) & `stop' != 0 {
+                                            qui replace item`j'= `=`m'+`kk'' if item`j'==`m'
+                                            local stop = 0
+                                        }
+                                    }
+                                }
+                                else if `m' == `=`nbm_`j''-1' | `m' >= `maxm`j'_t1_g1' {
+                                    * Top of the scale: merge into the nearest non-empty lower category
+                                    local stop = 1
+                                    forvalues kk = 1/`=`m'' {
+                                        qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                        local n_g0 = r(N)
+                                        qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                        local n_g1 = r(N)
+                                        if (`n_g0' != 0 | `n_g1' != 0) & `stop' != 0 {
+                                            qui replace item`j'= `=`m' - `kk'' if item`j'==`m'
+                                            local stop = 0
+                                        }
+                                    }
+                                }
+                                else {
+                                    * Interior category: the merge direction is drawn at random
+                                    if runiform()>0.5 {
+                                        local stop = 1
+                                        forvalues kk = 1/`m' {
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                            local n_g0 = r(N)
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                            local n_g1 = r(N)
+                                            if (`n_g0' != 0 | `n_g1' != 0) & `stop' != 0 {
+                                                qui replace item`j'= `=`m'-`kk'' if item`j'==`m'
+                                                local stop = 0
+                                            }
+                                        }
+                                    }
+                                    else {
+                                        local stop = 1
+                                        forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                            local n_g0 = r(N)
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                            local n_g1 = r(N)
+                                            if (`n_g0' != 0 | `n_g1' != 0) & `stop' != 0 {
+                                                qui replace item`j'=`=`m' + `kk'' if item`j'==`m'
+                                                local stop = 0
+                                            }
+                                            else {
+                                                * Next category up is empty in both groups:
+                                                * merge straight into category nbm_j
+                                                if `stop' != 0 {
+                                                    qui replace item`j'= `nbm_`j'' if item`j'==`m'
+                                                    local stop = 0
+                                                }
+                                            }
+                                        }
+                                    }
+                                }
+                            }
+                        }
+
+                        * Recode the remaining categories to consecutive integers starting at 0
+                        qui levelsof item`j'
+                        local val = r(levels)
+                        local checker: word 1 of `val'
+                        local checker2: word 2 of `val'
+                        local checker3: word 3 of `val'
+                        local nummoda=r(r)
+                        * r(r) is the number of distinct levels, including category 0. The model,
+                        * constraint and storage code below all expect the number of NON-ZERO
+                        * categories (as in the no-merge branch), hence the minus one.
+                        local nbmoda_`j'=`nummoda'-1
+                        if (`nummoda'==2) {
+                            qui recode item`j' (`checker'=0) (`checker2'=1)
+                        }
+                        if (`nummoda'==3) {
+                            if (`checker'!=0) {
+                                qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2)
+                            }
+                            else if (`checker2'!=1) {
+                                qui recode item`j' (`checker2'=1) (`checker3'=2)
+                            }
+                            else if (`checker3'!=2) {
+                                qui recode item`j' (`checker3'=2)
+                            }
+                        }
+                    }
+                }
+                else {
+                    forvalues jj=1/`nbitems' {
+                        local nbmoda_`jj'=`nbmoda'
+                    }
+                }
+
+                * ROSALI
+                qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt)
+                qui mat resmat=r(difitems)
+
+                * Count the detected items: the first nbitems cells of resmat hold the detected
+                * item numbers followed by missing values. Start from nbitems so that a row
+                * without any missing cell is counted as nbitems detections instead of zero.
+                local nbdetect = `nbitems'
+                forvalues jj=1/`nbitems' {
+                    if (missing(resmat[1,`jj'])) {
+                        local nbdetect = `jj'-1
+                        continue, break
+                    }
+                }
+
+                * Constraints. A non-zero flag in cell nbitems+i of resmat makes the tt effects
+                * of item i proportional across categories.
+                * NOTE(review): the flag presumably marks uniform DIF; confirm against rosali_original.
+                forvalues u=1/`nbdetect' {
+                    local difitems`u'=resmat[1,`u']
+                    local i=`difitems`u''
+                    if (`nbmoda_`i''==3 & resmat[1,`nbitems'+`i']!=0) {
+                        qui constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))
+                        local v=`u'+100
+                        qui constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))
+                    }
+                    if (`nbmoda_`i''==2 & resmat[1,`nbitems'+`i']!=0) {
+                        qui constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))
+                    }
+                }
+
+                * Model definition: one path per non-zero category, loading fixed to the category number
+                local mod "gsem "
+                local conformula = ""
+                forvalues i=1/`nbitems' {
+                    local mod = "`mod'"+"(1.item`i'<-THETA@1)"
+                    if (`nbmoda_`i''==3) {
+                        local mod = "`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)"
+                    }
+                    else if (`nbmoda_`i''==2) {
+                        local mod = "`mod'"+"(2.item`i'<-THETA@2)"
+                    }
+                }
+                * Detected items additionally get a group effect, plus the constraints defined above
+                forvalues u=1/`nbdetect' {
+                    local v=`difitems`u''
+                    local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)"
+                    if (`nbmoda_`v''==3) {
+                        local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)"
+                    }
+                    else if (`nbmoda_`v''==2) {
+                        local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)"
+                    }
+                    local w= 100+`u'
+                    if (resmat[1,`nbitems'+`v']!=0 & `nbmoda_`v''==3) {
+                        local conformula = "`conformula'" + "`u' " + "`w' "
+                    }
+                    else if (resmat[1,`nbitems'+`v']!=0 & `nbmoda_`v''==2) {
+                        local conformula = "`conformula'" + "`u' "
+                    }
+                }
+                if ("`conformula'" != "") {
+                    local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')"
+                }
+                else {
+                    local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent"
+                }
+
+                * Fit the model; W keeps the first two rows of r(table)
+                qui `mod'
+                mat V=r(table)
+                mat W=V[1..2,1...]
+
+                * Store the item parameters
+                forvalues j=1/`nbitems' {
+                    forvalues z=1/`nbmoda_`j'' {
+                        mat outmat[`k',colnumb(outmat,"item`j'_`z'")] = W[1,colnumb(W,"`z'.item`j':_cons")]
+                    }
+                }
+                * Store the DIF parameters, indexed by detection order u, and the detected item number
+                forvalues u=1/`nbdetect' {
+                    local j=`difitems`u''
+                    forvalues z=1/`nbmoda_`j'' {
+                        mat outmat[`k',colnumb(outmat,"dif_`u'_`z'")] = W[1,colnumb(W,"`z'.item`j':tt")]
+                    }
+                    mat outmat[`k',colnumb(outmat,"dif_detect_`u'")] = `j'
+                }
+
+                * Store the items that were simulated with DIF (first level of dif1..dif`nbdif')
+                forvalues d=1/`nbdif' {
+                    qui levelsof dif`d'
+                    local ldif = r(levels)
+                    local truedif: word 1 of `ldif'
+                    qui mat outmat[`k',colnumb(outmat,"real_dif_`d'")]=`truedif'
+                }
+                qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,colnumb(W,"THETA:tt")]
+                qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,colnumb(W,"THETA:tt")]
+                restore
+            }
+            putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace
+            putexcel A1=matrix(outmat), colnames
+        }
+    }
+}
diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S6.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S6.do
new file mode 100644
index 0000000..ba0d7f1
--- /dev/null
+++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S6.do
@@ -0,0 +1,364 @@
+*=================================================================================================================================================
+* Date : 2024-01-23
+* Stata version : Stata 18 SE
+*
+* This program analyses simulated data accounting for DIF through a partial credit model
+*
+* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea)
+*
+*
+*================================================================================================================================================
+adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom"
+
+* Scenario driver. For every sample size and sub-scenario (A to G) this script loads the
+* simulated replications, runs ROSALI DIF detection on each of the 1000 replications, refits
+* a partial credit model with gsem (group effect tt on the flagged items), and exports the
+* estimates to one Excel file per sub-scenario.
+
+local N = "50 100 200 300"
+local ss = "6"
+foreach s in `ss' {
+    foreach Nnn in `N' {
+        local Nn = `Nnn'
+        * Scenarios 1 to 4 are read from the NoDIF folder, all others from the DIF folder
+        local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'"
+        if (`s'<=4) {
+            local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'"
+        }
+        local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'"
+        local scenarios = "A B C D E F G"
+        foreach scen in `scenarios' {
+            import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear
+            rename TT tt
+
+            * Number of items per scenario
+            if (`s'<=2) {
+                local nbitems=4
+            }
+            else if (`s'<=4) {
+                local nbitems=7
+            }
+            else if (`s'<=12) {
+                local nbitems=4
+            }
+            else {
+                local nbitems=7
+            }
+
+            * Number of non-zero response categories: 3 for even scenarios, 1 for odd ones
+            if (mod(`s',2)==0) {
+                local nbmoda=3
+            }
+            else {
+                local nbmoda=1
+            }
+
+            * Number of items simulated with DIF
+            if (`s'<=4) {
+                local nbdif=0
+            }
+            else if (`s'<=8) {
+                local nbdif=1
+            }
+            else if (`s'<=16) {
+                local nbdif=2
+            }
+            else {
+                local nbdif=3
+            }
+
+            * taillemat = J*M cells for the item parameters + J*M cells for the DIF parameters
+            *           + J cells for the detected DIF items + nbdif cells for the true DIF items
+            *           + 2 cells for the group effect (beta) and its standard error
+            local taillemat=2*`nbitems'*`nbmoda'+`nbitems'+`nbdif'+2
+            local colna=""
+            forvalues i=1/`nbitems' {
+                forvalues z=1/`nbmoda' {
+                    local colna = "`colna'"+"item`i'_`z' "
+                    local colna = "`colna'"+"dif_`i'_`z' "
+                }
+            }
+            forvalues i=1/`nbitems' {
+                local colna = "`colna'"+"dif_detect_`i' "
+            }
+            forvalues i=1/`nbdif' {
+                local colna = "`colna'"+"real_dif_`i' "
+            }
+            local colna = "`colna'" + "beta " + "se_beta"
+
+            * One row per replication
+            mat outmat = J(1000,`taillemat',.)
+            mat colnames outmat= `colna'
+            di "Scenario `s'`scen' / N=`Nnn'"
+            forvalues k=1/1000 {
+                if (mod(`k',100)==0) {
+                    di "`k'/1000"
+                }
+                preserve
+                qui keep if replication==`k'
+
+                * Merge response categories that are not observed in both groups.
+                * Only done for polytomous items at N=50.
+                if (`nbmoda'>1 & `Nn'==50) {
+                    forvalues j = 1 / `nbitems' {
+                        * Lowest and highest observed category of item j in each group
+                        qui tab item`j' if tt == 0, matrow(rect1_g0_`j') matcell(nbrt1_g0_`j')
+                        local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1]
+                        local minm`j'_t1_g0 = rect1_g0_`j'[1,1]
+
+                        qui tab item`j' if tt == 1, matrow(rect1_g1_`j') matcell(nbrt1_g1_`j')
+                        local minm`j'_t1_g1 = rect1_g1_`j'[1,1]
+                        local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1]
+
+                        local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1')
+                        local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1')
+                        local nbm_`j' = `=`maxm_`j''-`minm_`j'''
+
+                        forvalues m = 0/`=`nbm_`j''-1' {
+                            qui count if item`j' == `m' & tt == 0
+                            local nb_rn1_g0 = r(N)
+                            qui count if item`j' == `m' & tt == 1
+                            local nb_rn1_g1 = r(N)
+                            local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1')
+                            * Category m is empty in at least one group: merge it with a neighbour
+                            if `nb_rn' == 0 {
+                                if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' {
+                                    * Bottom of the scale: merge into the nearest non-empty higher category
+                                    local stop = 1
+                                    forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                        qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                        local n_g0 = r(N)
+                                        qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                        local n_g1 = r(N)
+                                        if (`n_g0' != 0 | `n_g1' != 0) & `stop' != 0 {
+                                            qui replace item`j'= `=`m'+`kk'' if item`j'==`m'
+                                            local stop = 0
+                                        }
+                                    }
+                                }
+                                else if `m' == `=`nbm_`j''-1' | `m' >= `maxm`j'_t1_g1' {
+                                    * Top of the scale: merge into the nearest non-empty lower category
+                                    local stop = 1
+                                    forvalues kk = 1/`=`m'' {
+                                        qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                        local n_g0 = r(N)
+                                        qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                        local n_g1 = r(N)
+                                        if (`n_g0' != 0 | `n_g1' != 0) & `stop' != 0 {
+                                            qui replace item`j'= `=`m' - `kk'' if item`j'==`m'
+                                            local stop = 0
+                                        }
+                                    }
+                                }
+                                else {
+                                    * Interior category: the merge direction is drawn at random
+                                    if runiform()>0.5 {
+                                        local stop = 1
+                                        forvalues kk = 1/`m' {
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                            local n_g0 = r(N)
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                            local n_g1 = r(N)
+                                            if (`n_g0' != 0 | `n_g1' != 0) & `stop' != 0 {
+                                                qui replace item`j'= `=`m'-`kk'' if item`j'==`m'
+                                                local stop = 0
+                                            }
+                                        }
+                                    }
+                                    else {
+                                        local stop = 1
+                                        forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                            local n_g0 = r(N)
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                            local n_g1 = r(N)
+                                            if (`n_g0' != 0 | `n_g1' != 0) & `stop' != 0 {
+                                                qui replace item`j'=`=`m' + `kk'' if item`j'==`m'
+                                                local stop = 0
+                                            }
+                                            else {
+                                                * Next category up is empty in both groups:
+                                                * merge straight into category nbm_j
+                                                if `stop' != 0 {
+                                                    qui replace item`j'= `nbm_`j'' if item`j'==`m'
+                                                    local stop = 0
+                                                }
+                                            }
+                                        }
+                                    }
+                                }
+                            }
+                        }
+
+                        * Recode the remaining categories to consecutive integers starting at 0
+                        qui levelsof item`j'
+                        local val = r(levels)
+                        local checker: word 1 of `val'
+                        local checker2: word 2 of `val'
+                        local checker3: word 3 of `val'
+                        local nummoda=r(r)
+                        * r(r) is the number of distinct levels, including category 0. The model,
+                        * constraint and storage code below all expect the number of NON-ZERO
+                        * categories (as in the no-merge branch), hence the minus one.
+                        local nbmoda_`j'=`nummoda'-1
+                        if (`nummoda'==2) {
+                            qui recode item`j' (`checker'=0) (`checker2'=1)
+                        }
+                        if (`nummoda'==3) {
+                            if (`checker'!=0) {
+                                qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2)
+                            }
+                            else if (`checker2'!=1) {
+                                qui recode item`j' (`checker2'=1) (`checker3'=2)
+                            }
+                            else if (`checker3'!=2) {
+                                qui recode item`j' (`checker3'=2)
+                            }
+                        }
+                    }
+                }
+                else {
+                    forvalues jj=1/`nbitems' {
+                        local nbmoda_`jj'=`nbmoda'
+                    }
+                }
+
+                * ROSALI
+                qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt)
+                qui mat resmat=r(difitems)
+
+                * Count the detected items: the first nbitems cells of resmat hold the detected
+                * item numbers followed by missing values. Start from nbitems so that a row
+                * without any missing cell is counted as nbitems detections instead of zero.
+                local nbdetect = `nbitems'
+                forvalues jj=1/`nbitems' {
+                    if (missing(resmat[1,`jj'])) {
+                        local nbdetect = `jj'-1
+                        continue, break
+                    }
+                }
+
+                * Constraints. A non-zero flag in cell nbitems+i of resmat makes the tt effects
+                * of item i proportional across categories.
+                * NOTE(review): the flag presumably marks uniform DIF; confirm against rosali_original.
+                forvalues u=1/`nbdetect' {
+                    local difitems`u'=resmat[1,`u']
+                    local i=`difitems`u''
+                    if (`nbmoda_`i''==3 & resmat[1,`nbitems'+`i']!=0) {
+                        qui constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))
+                        local v=`u'+100
+                        qui constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))
+                    }
+                    if (`nbmoda_`i''==2 & resmat[1,`nbitems'+`i']!=0) {
+                        qui constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))
+                    }
+                }
+
+                * Model definition: one path per non-zero category, loading fixed to the category number
+                local mod "gsem "
+                local conformula = ""
+                forvalues i=1/`nbitems' {
+                    local mod = "`mod'"+"(1.item`i'<-THETA@1)"
+                    if (`nbmoda_`i''==3) {
+                        local mod = "`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)"
+                    }
+                    else if (`nbmoda_`i''==2) {
+                        local mod = "`mod'"+"(2.item`i'<-THETA@2)"
+                    }
+                }
+                * Detected items additionally get a group effect, plus the constraints defined above
+                forvalues u=1/`nbdetect' {
+                    local v=`difitems`u''
+                    local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)"
+                    if (`nbmoda_`v''==3) {
+                        local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)"
+                    }
+                    else if (`nbmoda_`v''==2) {
+                        local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)"
+                    }
+                    local w= 100+`u'
+                    if (resmat[1,`nbitems'+`v']!=0 & `nbmoda_`v''==3) {
+                        local conformula = "`conformula'" + "`u' " + "`w' "
+                    }
+                    else if (resmat[1,`nbitems'+`v']!=0 & `nbmoda_`v''==2) {
+                        local conformula = "`conformula'" + "`u' "
+                    }
+                }
+                if ("`conformula'" != "") {
+                    local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')"
+                }
+                else {
+                    local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent"
+                }
+
+                * Fit the model; W keeps the first two rows of r(table)
+                qui `mod'
+                mat V=r(table)
+                mat W=V[1..2,1...]
+
+                * Store the item parameters
+                forvalues j=1/`nbitems' {
+                    forvalues z=1/`nbmoda_`j'' {
+                        mat outmat[`k',colnumb(outmat,"item`j'_`z'")] = W[1,colnumb(W,"`z'.item`j':_cons")]
+                    }
+                }
+                * Store the DIF parameters, indexed by detection order u, and the detected item number
+                forvalues u=1/`nbdetect' {
+                    local j=`difitems`u''
+                    forvalues z=1/`nbmoda_`j'' {
+                        mat outmat[`k',colnumb(outmat,"dif_`u'_`z'")] = W[1,colnumb(W,"`z'.item`j':tt")]
+                    }
+                    mat outmat[`k',colnumb(outmat,"dif_detect_`u'")] = `j'
+                }
+
+                * Store the items that were simulated with DIF (first level of dif1..dif`nbdif')
+                forvalues d=1/`nbdif' {
+                    qui levelsof dif`d'
+                    local ldif = r(levels)
+                    local truedif: word 1 of `ldif'
+                    qui mat outmat[`k',colnumb(outmat,"real_dif_`d'")]=`truedif'
+                }
+                qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,colnumb(W,"THETA:tt")]
+                qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,colnumb(W,"THETA:tt")]
+                restore
+            }
+            putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace
+            putexcel A1=matrix(outmat), colnames
+        }
+    }
+}
diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S7.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S7.do
new file mode 100644
index 0000000..abdbd90
--- /dev/null
+++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S7.do
@@ -0,0 +1,364 @@
+*=================================================================================================================================================
+* Date : 2024-01-23
+* Stata version : Stata 18 SE
+*
+* This program analyses simulated data accounting for DIF through a partial credit model
+*
+* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea)
+*
+*
+*================================================================================================================================================
+adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom"
+
+* Scenario driver. For every sample size and sub-scenario (A to G) this script loads the
+* simulated replications, runs ROSALI DIF detection on each of the 1000 replications, refits
+* a partial credit model with gsem (group effect tt on the flagged items), and exports the
+* estimates to one Excel file per sub-scenario.
+
+local N = "50 100 200 300"
+local ss = "7"
+foreach s in `ss' {
+    foreach Nnn in `N' {
+        local Nn = `Nnn'
+        * Scenarios 1 to 4 are read from the NoDIF folder, all others from the DIF folder
+        local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'"
+        if (`s'<=4) {
+            local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'"
+        }
+        local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'"
+        local scenarios = "A B C D E F G"
+        foreach scen in `scenarios' {
+            import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear
+            rename TT tt
+
+            * Number of items per scenario
+            if (`s'<=2) {
+                local nbitems=4
+            }
+            else if (`s'<=4) {
+                local nbitems=7
+            }
+            else if (`s'<=12) {
+                local nbitems=4
+            }
+            else {
+                local nbitems=7
+            }
+
+            * Number of non-zero response categories: 3 for even scenarios, 1 for odd ones
+            if (mod(`s',2)==0) {
+                local nbmoda=3
+            }
+            else {
+                local nbmoda=1
+            }
+
+            * Number of items simulated with DIF
+            if (`s'<=4) {
+                local nbdif=0
+            }
+            else if (`s'<=8) {
+                local nbdif=1
+            }
+            else if (`s'<=16) {
+                local nbdif=2
+            }
+            else {
+                local nbdif=3
+            }
+
+            * taillemat = J*M cells for the item parameters + J*M cells for the DIF parameters
+            *           + J cells for the detected DIF items + nbdif cells for the true DIF items
+            *           + 2 cells for the group effect (beta) and its standard error
+            local taillemat=2*`nbitems'*`nbmoda'+`nbitems'+`nbdif'+2
+            local colna=""
+            forvalues i=1/`nbitems' {
+                forvalues z=1/`nbmoda' {
+                    local colna = "`colna'"+"item`i'_`z' "
+                    local colna = "`colna'"+"dif_`i'_`z' "
+                }
+            }
+            forvalues i=1/`nbitems' {
+                local colna = "`colna'"+"dif_detect_`i' "
+            }
+            forvalues i=1/`nbdif' {
+                local colna = "`colna'"+"real_dif_`i' "
+            }
+            local colna = "`colna'" + "beta " + "se_beta"
+
+            * One row per replication
+            mat outmat = J(1000,`taillemat',.)
+            mat colnames outmat= `colna'
+            di "Scenario `s'`scen' / N=`Nnn'"
+            forvalues k=1/1000 {
+                if (mod(`k',100)==0) {
+                    di "`k'/1000"
+                }
+                preserve
+                qui keep if replication==`k'
+
+                * Merge response categories that are not observed in both groups.
+                * Only done for polytomous items at N=50.
+                if (`nbmoda'>1 & `Nn'==50) {
+                    forvalues j = 1 / `nbitems' {
+                        * Lowest and highest observed category of item j in each group
+                        qui tab item`j' if tt == 0, matrow(rect1_g0_`j') matcell(nbrt1_g0_`j')
+                        local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1]
+                        local minm`j'_t1_g0 = rect1_g0_`j'[1,1]
+
+                        qui tab item`j' if tt == 1, matrow(rect1_g1_`j') matcell(nbrt1_g1_`j')
+                        local minm`j'_t1_g1 = rect1_g1_`j'[1,1]
+                        local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1]
+
+                        local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1')
+                        local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1')
+                        local nbm_`j' = `=`maxm_`j''-`minm_`j'''
+
+                        forvalues m = 0/`=`nbm_`j''-1' {
+                            qui count if item`j' == `m' & tt == 0
+                            local nb_rn1_g0 = r(N)
+                            qui count if item`j' == `m' & tt == 1
+                            local nb_rn1_g1 = r(N)
+                            local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1')
+                            * Category m is empty in at least one group: merge it with a neighbour
+                            if `nb_rn' == 0 {
+                                if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' {
+                                    * Bottom of the scale: merge into the nearest non-empty higher category
+                                    local stop = 1
+                                    forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                        qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                        local n_g0 = r(N)
+                                        qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                        local n_g1 = r(N)
+                                        if (`n_g0' != 0 | `n_g1' != 0) & `stop' != 0 {
+                                            qui replace item`j'= `=`m'+`kk'' if item`j'==`m'
+                                            local stop = 0
+                                        }
+                                    }
+                                }
+                                else if `m' == `=`nbm_`j''-1' | `m' >= `maxm`j'_t1_g1' {
+                                    * Top of the scale: merge into the nearest non-empty lower category
+                                    local stop = 1
+                                    forvalues kk = 1/`=`m'' {
+                                        qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                        local n_g0 = r(N)
+                                        qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                        local n_g1 = r(N)
+                                        if (`n_g0' != 0 | `n_g1' != 0) & `stop' != 0 {
+                                            qui replace item`j'= `=`m' - `kk'' if item`j'==`m'
+                                            local stop = 0
+                                        }
+                                    }
+                                }
+                                else {
+                                    * Interior category: the merge direction is drawn at random
+                                    if runiform()>0.5 {
+                                        local stop = 1
+                                        forvalues kk = 1/`m' {
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                            local n_g0 = r(N)
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                            local n_g1 = r(N)
+                                            if (`n_g0' != 0 | `n_g1' != 0) & `stop' != 0 {
+                                                qui replace item`j'= `=`m'-`kk'' if item`j'==`m'
+                                                local stop = 0
+                                            }
+                                        }
+                                    }
+                                    else {
+                                        local stop = 1
+                                        forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                            local n_g0 = r(N)
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                            local n_g1 = r(N)
+                                            if (`n_g0' != 0 | `n_g1' != 0) & `stop' != 0 {
+                                                qui replace item`j'=`=`m' + `kk'' if item`j'==`m'
+                                                local stop = 0
+                                            }
+                                            else {
+                                                * Next category up is empty in both groups:
+                                                * merge straight into category nbm_j
+                                                if `stop' != 0 {
+                                                    qui replace item`j'= `nbm_`j'' if item`j'==`m'
+                                                    local stop = 0
+                                                }
+                                            }
+                                        }
+                                    }
+                                }
+                            }
+                        }
+
+                        * Recode the remaining categories to consecutive integers starting at 0
+                        qui levelsof item`j'
+                        local val = r(levels)
+                        local checker: word 1 of `val'
+                        local checker2: word 2 of `val'
+                        local checker3: word 3 of `val'
+                        local nummoda=r(r)
+                        * r(r) is the number of distinct levels, including category 0. The model,
+                        * constraint and storage code below all expect the number of NON-ZERO
+                        * categories (as in the no-merge branch), hence the minus one.
+                        local nbmoda_`j'=`nummoda'-1
+                        if (`nummoda'==2) {
+                            qui recode item`j' (`checker'=0) (`checker2'=1)
+                        }
+                        if (`nummoda'==3) {
+                            if (`checker'!=0) {
+                                qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2)
+                            }
+                            else if (`checker2'!=1) {
+                                qui recode item`j' (`checker2'=1) (`checker3'=2)
+                            }
+                            else if (`checker3'!=2) {
+                                qui recode item`j' (`checker3'=2)
+                            }
+                        }
+                    }
+                }
+                else {
+                    forvalues jj=1/`nbitems' {
+                        local nbmoda_`jj'=`nbmoda'
+                    }
+                }
+
+                * ROSALI
+                qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt)
+                qui mat resmat=r(difitems)
+
+                * Count the detected items: the first nbitems cells of resmat hold the detected
+                * item numbers followed by missing values. Start from nbitems so that a row
+                * without any missing cell is counted as nbitems detections instead of zero.
+                local nbdetect = `nbitems'
+                forvalues jj=1/`nbitems' {
+                    if (missing(resmat[1,`jj'])) {
+                        local nbdetect = `jj'-1
+                        continue, break
+                    }
+                }
+
+                * Constraints. A non-zero flag in cell nbitems+i of resmat makes the tt effects
+                * of item i proportional across categories.
+                * NOTE(review): the flag presumably marks uniform DIF; confirm against rosali_original.
+                forvalues u=1/`nbdetect' {
+                    local difitems`u'=resmat[1,`u']
+                    local i=`difitems`u''
+                    if (`nbmoda_`i''==3 & resmat[1,`nbitems'+`i']!=0) {
+                        qui constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))
+                        local v=`u'+100
+                        qui constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))
+                    }
+                    if (`nbmoda_`i''==2 & resmat[1,`nbitems'+`i']!=0) {
+                        qui constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))
+                    }
+                }
+
+                * Model definition: one path per non-zero category, loading fixed to the category number
+                local mod "gsem "
+                local conformula = ""
+                forvalues i=1/`nbitems' {
+                    local mod = "`mod'"+"(1.item`i'<-THETA@1)"
+                    if (`nbmoda_`i''==3) {
+                        local mod = "`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)"
+                    }
+                    else if (`nbmoda_`i''==2) {
+                        local mod = "`mod'"+"(2.item`i'<-THETA@2)"
+                    }
+                }
+                * Detected items additionally get a group effect, plus the constraints defined above
+                forvalues u=1/`nbdetect' {
+                    local v=`difitems`u''
+                    local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)"
+                    if (`nbmoda_`v''==3) {
+                        local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)"
+                    }
+                    else if (`nbmoda_`v''==2) {
+                        local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)"
+                    }
+                    local w= 100+`u'
+                    if (resmat[1,`nbitems'+`v']!=0 & `nbmoda_`v''==3) {
+                        local conformula = "`conformula'" + "`u' " + "`w' "
+                    }
+                    else if (resmat[1,`nbitems'+`v']!=0 & `nbmoda_`v''==2) {
+                        local conformula = "`conformula'" + "`u' "
+                    }
+                }
+                if ("`conformula'" != "") {
+                    local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')"
+                }
+                else {
+                    local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent"
+                }
+
+                * Fit the model; W keeps the first two rows of r(table)
+                qui `mod'
+                mat V=r(table)
+                mat W=V[1..2,1...]
+
+                * Store the item parameters
+                forvalues j=1/`nbitems' {
+                    forvalues z=1/`nbmoda_`j'' {
+                        mat outmat[`k',colnumb(outmat,"item`j'_`z'")] = W[1,colnumb(W,"`z'.item`j':_cons")]
+                    }
+                }
+                * Store the DIF parameters, indexed by detection order u, and the detected item number
+                forvalues u=1/`nbdetect' {
+                    local j=`difitems`u''
+                    forvalues z=1/`nbmoda_`j'' {
+                        mat outmat[`k',colnumb(outmat,"dif_`u'_`z'")] = W[1,colnumb(W,"`z'.item`j':tt")]
+                    }
+                    mat outmat[`k',colnumb(outmat,"dif_detect_`u'")] = `j'
+                }
+
+                * Store the items that were simulated with DIF (first level of dif1..dif`nbdif')
+                forvalues d=1/`nbdif' {
+                    qui levelsof dif`d'
+                    local ldif = r(levels)
+                    local truedif: word 1 of `ldif'
+                    qui mat outmat[`k',colnumb(outmat,"real_dif_`d'")]=`truedif'
+                }
+                qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,colnumb(W,"THETA:tt")]
+                qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,colnumb(W,"THETA:tt")]
+                restore
+            }
+            putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace
+            putexcel A1=matrix(outmat), colnames
+        }
+    }
+}
diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S8.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S8.do
new file mode 100644
index 0000000..52a3e1a
--- /dev/null
+++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S8.do
@@ -0,0 +1,364 @@
+*=================================================================================================================================================
+* Date : 2024-01-23
+* Stata version : Stata 18 SE
+*
+* This program analyses simulated data accounting for DIF through a partial credit model
+*
+* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea)
+*
+*
+*================================================================================================================================================
+* Scenario driver: for each sample size and each sub-scenario (A-G) this script
+*   1. imports the simulated replications,
+*   2. at N=50 with polytomous items, merges response categories that are
+*      empty in at least one tt group,
+*   3. runs rosali_original to detect DIF items between the tt groups,
+*   4. refits a gsem partial credit model including the detected DIF effects,
+*   5. stores one row of estimates per replication and exports the matrix.
+* NOTE(review): the merge direction for interior categories is drawn with
+* runiform() and no seed is set in this file, so N=50 runs are presumably
+* not reproducible unless the caller sets a seed - confirm.
+adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom"
+
+
+local N = "50 100 200 300"
+local ss = "8"
+foreach s in `ss' {
+    foreach Nnn in `N' {
+        local Nn = `Nnn'
+        * Scenarios 1-4 are read from the NoDIF folder, all others from the DIF folder
+        local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'"
+        if (`s'<=4) {
+            local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'"
+        }
+        local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'"
+        local scenarios = "A B C D E F G"
+        foreach scen in `scenarios' {
+            clear
+            import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear
+            rename TT tt
+
+            * Number of items of the scenario
+            if (`s'<=2) {
+                local nbitems=4
+            }
+            else if (`s'<=4) {
+                local nbitems=7
+            }
+            else if (`s'<=12) {
+                local nbitems=4
+            }
+            else {
+                local nbitems=7
+            }
+
+            * Highest response category: 3 for even scenarios, 1 for odd ones
+            * (presumably items are coded 0..nbmoda - confirm against the data)
+            if (mod(`s',2)==0) {
+                local nbmoda=3
+            }
+            else {
+                local nbmoda=1
+            }
+
+            * Number of items simulated with DIF
+            if (`s'<=4) {
+                local nbdif=0
+            }
+            else if (`s'<=8) {
+                local nbdif=1
+            }
+            else if (`s'<=16) {
+                local nbdif=2
+            }
+            else {
+                local nbdif=3
+            }
+
+            * Result matrix layout: nbitems x nbmoda item parameters, nbitems x nbmoda
+            * DIF parameters, nbitems detected-item slots, nbdif true DIF items,
+            * then beta and se_beta
+            local taillemat=2*`nbitems'*`nbmoda'+`nbitems'+`nbdif'+2
+            local colna=""
+            forvalues i=1/`nbitems' {
+                forvalues z=1/`nbmoda' {
+                    local colna = "`colna'"+"item`i'_`z' "
+                    local colna = "`colna'"+"dif_`i'_`z' "
+                }
+            }
+            forvalues i=1/`nbitems' {
+                local colna = "`colna'"+"dif_detect_`i' "
+            }
+            forvalues i=1/`nbdif' {
+                local colna = "`colna'"+"real_dif_`i' "
+            }
+            local colna = "`colna'" + "beta " + "se_beta"
+
+            mat outmat = J(1000,`taillemat',.)
+            mat colnames outmat= `colna'
+            di "Scenario `s'`scen' / N=`Nnn'"
+            forvalues k=1/1000 {
+                if (mod(`k',100)==0) {
+                    di "`k'/1000"
+                }
+                preserve
+                qui keep if replication==`k'
+
+                * Merge response categories that are not observed in both groups
+                if (`nbmoda'>1 & `Nn'==50) {
+                    * comz flags replications in which a category was empty in a group
+                    qui gen comz = 0
+                    forvalues j = 1 / `nbitems' {
+                        * Lowest and highest observed category in each group
+                        qui tab item`j' if tt == 0, matrow(rect1_g0_`j')
+                        local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1]
+                        local minm`j'_t1_g0 = rect1_g0_`j'[1,1]
+
+                        qui tab item`j' if tt == 1, matrow(rect1_g1_`j')
+                        local minm`j'_t1_g1 = rect1_g1_`j'[1,1]
+                        local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1]
+
+                        local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1')
+                        local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1')
+                        local nbm_`j' = `=`maxm_`j''-`minm_`j'''
+
+                        * Category 3 is only flagged here, it is never merged by the loop below
+                        qui count if item`j' == 3 & tt == 0
+                        local top_g0 = r(N)
+                        qui count if item`j' == 3 & tt == 1
+                        local top_g1 = r(N)
+                        if min(`top_g0',`top_g1')==0 {
+                            qui replace comz = 1
+                        }
+
+                        forvalues m = 0/`=`nbm_`j''-1' {
+                            qui count if item`j' == `m' & tt == 0
+                            local nb_rn1_g0 = r(N)
+                            qui count if item`j' == `m' & tt == 1
+                            local nb_rn1_g1 = r(N)
+                            local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1')
+                            if `nb_rn' == 0 {
+                                qui replace comz = 1
+                                if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' {
+                                    * Bottom of the scale: merge into the nearest observed higher category
+                                    local stop = 1
+                                    forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                        qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                        local v`kk'1_0 = r(N)
+                                        qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                        local v`kk'1_1 = r(N)
+                                        if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                            qui replace item`j'= `=`m'+`kk'' if item`j'==`m'
+                                            local stop = 0
+                                        }
+                                    }
+                                }
+                                else if `m' == `=`nbm_`j''-1' | `m' >= `maxm`j'_t1_g1' {
+                                    * Top of the scale: merge into the nearest observed lower category
+                                    local stop = 1
+                                    forvalues kk = 1/`m' {
+                                        qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                        local v`kk'1_0 = r(N)
+                                        qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                        local v`kk'1_1 = r(N)
+                                        if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                            qui replace item`j'= `=`m' - `kk'' if item`j'==`m'
+                                            local stop = 0
+                                        }
+                                    }
+                                }
+                                else {
+                                    * Interior category: merge downwards or upwards at random
+                                    if runiform()>0.5 {
+                                        local stop = 1
+                                        forvalues kk = 1/`m' {
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                            local v`kk'1_0 = r(N)
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                            local v`kk'1_1 = r(N)
+                                            if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                                qui replace item`j'= `=`m'-`kk'' if item`j'==`m'
+                                                local stop = 0
+                                            }
+                                        }
+                                    }
+                                    else {
+                                        local stop = 1
+                                        forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                            local v`kk'1_0 = r(N)
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                            local v`kk'1_1 = r(N)
+                                            if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                                qui replace item`j'=`=`m' + `kk'' if item`j'==`m'
+                                                local stop = 0
+                                            }
+                                            else {
+                                                * The next category up is empty too: fall back on category nbm_j
+                                                if `stop' != 0 {
+                                                    qui replace item`j'= `nbm_`j'' if item`j'==`m'
+                                                    local stop = 0
+                                                }
+                                            }
+                                        }
+                                    }
+                                }
+                            }
+                        }
+
+                        * Recode the remaining categories to consecutive integers from 0
+                        qui levelsof item`j'
+                        local val = r(levels)
+                        local checker: word 1 of `val'
+                        local checker2: word 2 of `val'
+                        local checker3: word 3 of `val'
+                        local nummoda=r(r)
+                        * nbmoda_j is the highest category after recoding, i.e. the number
+                        * of levels minus one. Storing the number of levels itself made the
+                        * model, the constraints and the output columns refer to a category
+                        * that does not exist.
+                        local nbmoda_`j'=`nummoda'-1
+                        if (`nummoda'==2) {
+                            qui recode item`j' (`checker'=0) (`checker2'=1)
+                        }
+                        if (`nummoda'==3) {
+                            if (`checker'!=0) {
+                                qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2)
+                            }
+                            else if (`checker2'!=1) {
+                                qui recode item`j' (`checker2'=1) (`checker3'=2)
+                            }
+                            else if (`checker3'!=2) {
+                                qui recode item`j' (`checker3'=2)
+                            }
+                        }
+                    }
+                }
+                else {
+                    forvalues jj=1/`nbitems' {
+                        local nbmoda_`jj'=`nbmoda'
+                    }
+                }
+
+
+                * ROSALI
+                qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt)
+                qui mat resmat=r(difitems)
+
+                * Number of detected items = number of leading non-missing entries of
+                * resmat. Starting from nbitems covers the case where none of the
+                * first nbitems entries is missing (previously counted as 0).
+                local nbdetect = `nbitems'
+                local stop = 0
+                forvalues jj=1/`nbitems' {
+                    if (`stop'==0) {
+                        if (missing(resmat[1,`jj'])) {
+                            local stop = 1
+                            local nbdetect = `jj'-1
+                        }
+                    }
+                }
+
+                * Constraints for detected items whose flag in resmat[1,nbitems+i] is non-zero
+                * (presumably the uniform DIF indicator returned by rosali - confirm)
+                forvalues u=1/`nbdetect' {
+                    local difitems`u'=resmat[1,`u']
+                    local i=`difitems`u''
+                    if ((`nbmoda_`i''==3 | `nbmoda_`i''==2) & resmat[1,`nbitems'+`i']!=0) {
+                        local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+                        qui `constrnt`u''
+                        if (`nbmoda_`i''==3) {
+                            * Second constraint is numbered 100+u
+                            local v=`u'+100
+                            local constrnt`u'_2 = "constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))"
+                            qui `constrnt`u'_2'
+                        }
+                    }
+                }
+
+                * Model definition: one equation per non-zero category of every item
+                local mod "gsem "
+                local conformula = ""
+                forvalues i=1/`nbitems' {
+                    local mod = "`mod'"+"(1.item`i'<-THETA@1)"
+                    if (`nbmoda_`i''==3) {
+                        local mod = "`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)"
+                    }
+                    else if (`nbmoda_`i''==2) {
+                        local mod = "`mod'"+"(2.item`i'<-THETA@2)"
+                    }
+                }
+                * Group effect on every category of the detected items
+                forvalues u=1/`nbdetect' {
+                    local v=`difitems`u''
+                    local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)"
+                    if (`nbmoda_`v''==3) {
+                        local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)"
+                    }
+                    else if (`nbmoda_`v''==2) {
+                        local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)"
+                    }
+                    local w= 100+`u'
+                    if (resmat[1,`nbitems'+`v']!=0 & `nbmoda_`v''==3) {
+                        local conformula = "`conformula'" + "`u' " + "`w' "
+                    }
+                    else if (resmat[1,`nbitems'+`v']!=0 & `nbmoda_`v''==2) {
+                        local conformula = "`conformula'" + "`u' "
+                    }
+                }
+                if ("`conformula'" != "") {
+                    local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')"
+                }
+                else {
+                    local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent"
+                }
+                * Model estimation; W keeps the first two rows of r(table)
+                qui `mod'
+                mat V=r(table)
+                mat W=V[1..2,1...]
+
+                * Store item parameters
+                forvalues j=1/`nbitems' {
+                    forvalues z=1/`nbmoda_`j'' {
+                        mat outmat[`k',colnumb(outmat,"item`j'_`z'")] = W[1,colnumb(W,"`z'.item`j':_cons")]
+                    }
+                }
+                * Store DIF parameters; columns are indexed by detection rank u
+                forvalues u=1/`nbdetect' {
+                    local j=`difitems`u''
+                    mat outmat[`k',colnumb(outmat,"dif_detect_`u'")] = `j'
+                    forvalues z=1/`nbmoda_`j'' {
+                        mat outmat[`k',colnumb(outmat,"dif_`u'_`z'")] = W[1,colnumb(W,"`z'.item`j':tt")]
+                    }
+                }
+
+                * Store the items that were simulated with DIF (first level of dif1, dif2, ...)
+                forvalues d=1/`nbdif' {
+                    qui levelsof dif`d'
+                    local ldif`d' = r(levels)
+                    local diff`d': word 1 of `ldif`d''
+                    qui mat outmat[`k',colnumb(outmat,"real_dif_`d'")]=`diff`d''
+                }
+                qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,colnumb(W,"THETA:tt")]
+                qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,colnumb(W,"THETA:tt")]
+                restore
+            }
+            putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace
+            putexcel A1=matrix(outmat), colnames
+        }
+    }
+}
diff --git a/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S9.do b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S9.do
new file mode 100644
index 0000000..c1525e7
--- /dev/null
+++ b/Scripts/Analysis/DIF-ROSALI/scénarios/pcm_dif_rosali_S9.do
@@ -0,0 +1,364 @@
+*=================================================================================================================================================
+* Date : 2024-01-23
+* Stata version : Stata 18 SE
+*
+* This program analyses simulated data accounting for DIF through a partial credit model
+*
+* ado-files needed : - pcm, rosali (version 5.5 October 25, 2023, available on gitea)
+*
+*
+*================================================================================================================================================
+* Scenario driver: for each sample size and each sub-scenario (A-G) this script
+*   1. imports the simulated replications,
+*   2. at N=50 with polytomous items, merges response categories that are
+*      empty in at least one tt group,
+*   3. runs rosali_original to detect DIF items between the tt groups,
+*   4. refits a gsem partial credit model including the detected DIF effects,
+*   5. stores one row of estimates per replication and exports the matrix.
+* NOTE(review): the merge direction for interior categories is drawn with
+* runiform() and no seed is set in this file, so N=50 runs are presumably
+* not reproducible unless the caller sets a seed - confirm.
+adopath+"/home/corentin/Documents/These/Recherche/ROSALI-SIM/Modules/rosali_custom"
+
+
+local N = "50 100 200 300"
+local ss = "9"
+foreach s in `ss' {
+    foreach Nnn in `N' {
+        local Nn = `Nnn'
+        * Scenarios 1-4 are read from the NoDIF folder, all others from the DIF folder
+        local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/DIF/N`Nn'"
+        if (`s'<=4) {
+            local path_data = "/home/corentin/Documents/These/Recherche/Simulations/Data/NoDIF/N`Nn'"
+        }
+        local path_res = "/home/corentin/Documents/These/Recherche/Simulations/Analysis/ROSALI-DIF/N`Nn'"
+        local scenarios = "A B C D E F G"
+        foreach scen in `scenarios' {
+            clear
+            import delim "`path_data'/scenario_`s'`scen'_`Nn'.csv", encoding(ISO-8859-2) case(preserve) clear
+            rename TT tt
+
+            * Number of items of the scenario
+            if (`s'<=2) {
+                local nbitems=4
+            }
+            else if (`s'<=4) {
+                local nbitems=7
+            }
+            else if (`s'<=12) {
+                local nbitems=4
+            }
+            else {
+                local nbitems=7
+            }
+
+            * Highest response category: 3 for even scenarios, 1 for odd ones
+            * (presumably items are coded 0..nbmoda - confirm against the data)
+            if (mod(`s',2)==0) {
+                local nbmoda=3
+            }
+            else {
+                local nbmoda=1
+            }
+
+            * Number of items simulated with DIF
+            if (`s'<=4) {
+                local nbdif=0
+            }
+            else if (`s'<=8) {
+                local nbdif=1
+            }
+            else if (`s'<=16) {
+                local nbdif=2
+            }
+            else {
+                local nbdif=3
+            }
+
+            * Result matrix layout: nbitems x nbmoda item parameters, nbitems x nbmoda
+            * DIF parameters, nbitems detected-item slots, nbdif true DIF items,
+            * then beta and se_beta
+            local taillemat=2*`nbitems'*`nbmoda'+`nbitems'+`nbdif'+2
+            local colna=""
+            forvalues i=1/`nbitems' {
+                forvalues z=1/`nbmoda' {
+                    local colna = "`colna'"+"item`i'_`z' "
+                    local colna = "`colna'"+"dif_`i'_`z' "
+                }
+            }
+            forvalues i=1/`nbitems' {
+                local colna = "`colna'"+"dif_detect_`i' "
+            }
+            forvalues i=1/`nbdif' {
+                local colna = "`colna'"+"real_dif_`i' "
+            }
+            local colna = "`colna'" + "beta " + "se_beta"
+
+            mat outmat = J(1000,`taillemat',.)
+            mat colnames outmat= `colna'
+            di "Scenario `s'`scen' / N=`Nnn'"
+            forvalues k=1/1000 {
+                if (mod(`k',100)==0) {
+                    di "`k'/1000"
+                }
+                preserve
+                qui keep if replication==`k'
+
+                * Merge response categories that are not observed in both groups
+                if (`nbmoda'>1 & `Nn'==50) {
+                    * comz flags replications in which a category was empty in a group
+                    qui gen comz = 0
+                    forvalues j = 1 / `nbitems' {
+                        * Lowest and highest observed category in each group
+                        qui tab item`j' if tt == 0, matrow(rect1_g0_`j')
+                        local maxm`j'_t1_g0 = rect1_g0_`j'[r(r),1]
+                        local minm`j'_t1_g0 = rect1_g0_`j'[1,1]
+
+                        qui tab item`j' if tt == 1, matrow(rect1_g1_`j')
+                        local minm`j'_t1_g1 = rect1_g1_`j'[1,1]
+                        local maxm`j'_t1_g1 = rect1_g1_`j'[r(r),1]
+
+                        local minm_`j' = min(`minm`j'_t1_g0',`minm`j'_t1_g1')
+                        local maxm_`j' = max(`maxm`j'_t1_g0',`maxm`j'_t1_g1')
+                        local nbm_`j' = `=`maxm_`j''-`minm_`j'''
+
+                        * Category 3 is only flagged here, it is never merged by the loop below
+                        qui count if item`j' == 3 & tt == 0
+                        local top_g0 = r(N)
+                        qui count if item`j' == 3 & tt == 1
+                        local top_g1 = r(N)
+                        if min(`top_g0',`top_g1')==0 {
+                            qui replace comz = 1
+                        }
+
+                        forvalues m = 0/`=`nbm_`j''-1' {
+                            qui count if item`j' == `m' & tt == 0
+                            local nb_rn1_g0 = r(N)
+                            qui count if item`j' == `m' & tt == 1
+                            local nb_rn1_g1 = r(N)
+                            local nb_rn = min(`nb_rn1_g0',`nb_rn1_g1')
+                            if `nb_rn' == 0 {
+                                qui replace comz = 1
+                                if `m' == 0 | `m' < `minm`j'_t1_g0' | `m' < `minm`j'_t1_g1' {
+                                    * Bottom of the scale: merge into the nearest observed higher category
+                                    local stop = 1
+                                    forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                        qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                        local v`kk'1_0 = r(N)
+                                        qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                        local v`kk'1_1 = r(N)
+                                        if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                            qui replace item`j'= `=`m'+`kk'' if item`j'==`m'
+                                            local stop = 0
+                                        }
+                                    }
+                                }
+                                else if `m' == `=`nbm_`j''-1' | `m' >= `maxm`j'_t1_g1' {
+                                    * Top of the scale: merge into the nearest observed lower category
+                                    local stop = 1
+                                    forvalues kk = 1/`m' {
+                                        qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                        local v`kk'1_0 = r(N)
+                                        qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                        local v`kk'1_1 = r(N)
+                                        if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                            qui replace item`j'= `=`m' - `kk'' if item`j'==`m'
+                                            local stop = 0
+                                        }
+                                    }
+                                }
+                                else {
+                                    * Interior category: merge downwards or upwards at random
+                                    if runiform()>0.5 {
+                                        local stop = 1
+                                        forvalues kk = 1/`m' {
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 0
+                                            local v`kk'1_0 = r(N)
+                                            qui count if item`j' == `=`m' - `kk'' & tt == 1
+                                            local v`kk'1_1 = r(N)
+                                            if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                                qui replace item`j'= `=`m'-`kk'' if item`j'==`m'
+                                                local stop = 0
+                                            }
+                                        }
+                                    }
+                                    else {
+                                        local stop = 1
+                                        forvalues kk = 1/`=`nbm_`j''-`m'' {
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 0
+                                            local v`kk'1_0 = r(N)
+                                            qui count if item`j' == `=`m' + `kk'' & tt == 1
+                                            local v`kk'1_1 = r(N)
+                                            if (`v`kk'1_0' != 0 | `v`kk'1_1' != 0) & `stop' != 0 {
+                                                qui replace item`j'=`=`m' + `kk'' if item`j'==`m'
+                                                local stop = 0
+                                            }
+                                            else {
+                                                * The next category up is empty too: fall back on category nbm_j
+                                                if `stop' != 0 {
+                                                    qui replace item`j'= `nbm_`j'' if item`j'==`m'
+                                                    local stop = 0
+                                                }
+                                            }
+                                        }
+                                    }
+                                }
+                            }
+                        }
+
+                        * Recode the remaining categories to consecutive integers from 0
+                        qui levelsof item`j'
+                        local val = r(levels)
+                        local checker: word 1 of `val'
+                        local checker2: word 2 of `val'
+                        local checker3: word 3 of `val'
+                        local nummoda=r(r)
+                        * nbmoda_j is the highest category after recoding, i.e. the number
+                        * of levels minus one. Storing the number of levels itself made the
+                        * model, the constraints and the output columns refer to a category
+                        * that does not exist.
+                        local nbmoda_`j'=`nummoda'-1
+                        if (`nummoda'==2) {
+                            qui recode item`j' (`checker'=0) (`checker2'=1)
+                        }
+                        if (`nummoda'==3) {
+                            if (`checker'!=0) {
+                                qui recode item`j' (`checker'=0) (`checker2'=1) (`checker3'=2)
+                            }
+                            else if (`checker2'!=1) {
+                                qui recode item`j' (`checker2'=1) (`checker3'=2)
+                            }
+                            else if (`checker3'!=2) {
+                                qui recode item`j' (`checker3'=2)
+                            }
+                        }
+                    }
+                }
+                else {
+                    forvalues jj=1/`nbitems' {
+                        local nbmoda_`jj'=`nbmoda'
+                    }
+                }
+
+
+                * ROSALI
+                qui rosali_original item1-item`nbitems' item1-item`nbitems', group(tt)
+                qui mat resmat=r(difitems)
+
+                * Number of detected items = number of leading non-missing entries of
+                * resmat. Starting from nbitems covers the case where none of the
+                * first nbitems entries is missing (previously counted as 0).
+                local nbdetect = `nbitems'
+                local stop = 0
+                forvalues jj=1/`nbitems' {
+                    if (`stop'==0) {
+                        if (missing(resmat[1,`jj'])) {
+                            local stop = 1
+                            local nbdetect = `jj'-1
+                        }
+                    }
+                }
+
+                * Constraints for detected items whose flag in resmat[1,nbitems+i] is non-zero
+                * (presumably the uniform DIF indicator returned by rosali - confirm)
+                forvalues u=1/`nbdetect' {
+                    local difitems`u'=resmat[1,`u']
+                    local i=`difitems`u''
+                    if ((`nbmoda_`i''==3 | `nbmoda_`i''==2) & resmat[1,`nbitems'+`i']!=0) {
+                        local constrnt`u' = "constraint `u' 2*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([2.item`i']_cons-([2.item`i']_cons+[2.item`i'] tt))"
+                        qui `constrnt`u''
+                        if (`nbmoda_`i''==3) {
+                            * Second constraint is numbered 100+u
+                            local v=`u'+100
+                            local constrnt`u'_2 = "constraint `v' 3*([1.item`i']_cons-([1.item`i']_cons+[1.item`i'] tt))=([3.item`i']_cons-([3.item`i']_cons+[3.item`i'] tt))"
+                            qui `constrnt`u'_2'
+                        }
+                    }
+                }
+
+                * Model definition: one equation per non-zero category of every item
+                local mod "gsem "
+                local conformula = ""
+                forvalues i=1/`nbitems' {
+                    local mod = "`mod'"+"(1.item`i'<-THETA@1)"
+                    if (`nbmoda_`i''==3) {
+                        local mod = "`mod'"+"(2.item`i'<-THETA@2)(3.item`i'<-THETA@3)"
+                    }
+                    else if (`nbmoda_`i''==2) {
+                        local mod = "`mod'"+"(2.item`i'<-THETA@2)"
+                    }
+                }
+                * Group effect on every category of the detected items
+                forvalues u=1/`nbdetect' {
+                    local v=`difitems`u''
+                    local mod = "`mod'"+"(1.item`v'<-THETA@1 tt)"
+                    if (`nbmoda_`v''==3) {
+                        local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)(3.item`v'<-THETA@3 tt)"
+                    }
+                    else if (`nbmoda_`v''==2) {
+                        local mod = "`mod'"+"(2.item`v'<-THETA@2 tt)"
+                    }
+                    local w= 100+`u'
+                    if (resmat[1,`nbitems'+`v']!=0 & `nbmoda_`v''==3) {
+                        local conformula = "`conformula'" + "`u' " + "`w' "
+                    }
+                    else if (resmat[1,`nbitems'+`v']!=0 & `nbmoda_`v''==2) {
+                        local conformula = "`conformula'" + "`u' "
+                    }
+                }
+                if ("`conformula'" != "") {
+                    local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent constraint(`conformula')"
+                }
+                else {
+                    local mod = "`mod'" + "(THETA<-tt), mlogit tol(0.01) iterate(500) latent(THETA) nocapslatent"
+                }
+                * Model estimation; W keeps the first two rows of r(table)
+                qui `mod'
+                mat V=r(table)
+                mat W=V[1..2,1...]
+
+                * Store item parameters
+                forvalues j=1/`nbitems' {
+                    forvalues z=1/`nbmoda_`j'' {
+                        mat outmat[`k',colnumb(outmat,"item`j'_`z'")] = W[1,colnumb(W,"`z'.item`j':_cons")]
+                    }
+                }
+                * Store DIF parameters; columns are indexed by detection rank u
+                forvalues u=1/`nbdetect' {
+                    local j=`difitems`u''
+                    mat outmat[`k',colnumb(outmat,"dif_detect_`u'")] = `j'
+                    forvalues z=1/`nbmoda_`j'' {
+                        mat outmat[`k',colnumb(outmat,"dif_`u'_`z'")] = W[1,colnumb(W,"`z'.item`j':tt")]
+                    }
+                }
+
+                * Store the items that were simulated with DIF (first level of dif1, dif2, ...)
+                forvalues d=1/`nbdif' {
+                    qui levelsof dif`d'
+                    local ldif`d' = r(levels)
+                    local diff`d': word 1 of `ldif`d''
+                    qui mat outmat[`k',colnumb(outmat,"real_dif_`d'")]=`diff`d''
+                }
+                qui mat outmat[`k',colnumb(outmat,"beta")]=W[1,colnumb(W,"THETA:tt")]
+                qui mat outmat[`k',colnumb(outmat,"se_beta")]=W[2,colnumb(W,"THETA:tt")]
+                restore
+            }
+            putexcel set "`path_res'/`s'`scen'_`Nn'_original.xls", sheet("outmat") replace
+            putexcel A1=matrix(outmat), colnames
+        }
+    }
+}