0% found this document useful (0 votes)

8 views7 pages

Transversales Script

1. The document describes strategies for stratified two-stage cluster sampling to estimate population totals. 2. It shows how to sample primary sampling units (PSUs) in the first stage and households in the second stage. Weights are calculated for each unit. 3. Estimates, standard errors, and other statistics are then calculated from the sample data using the weights. Histograms and boxplots are presented to examine the weight distributions.

Uploaded by

marco antonio diaz barragan

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

8 views7 pages

Transversales Script

Uploaded by

marco antonio diaz barragan

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 7

Estrategias transversales

Muestreo en dos etapas estratificado

library(dplyr)
library(TeachingSampling)
# Load the person-level BigCity data (presumably shipped with
# TeachingSampling -- confirm against the package documentation).
data("BigCity")

# First-stage frame: one row per PSU carrying its stratum label, the number of
# person records, and the PSU totals of income and expenditure.
FrameI <- summarise(
  group_by(BigCity, PSU),
  Stratum = unique(Stratum),
  Persons = n(),
  Income = sum(Income),
  Expenditure = sum(Expenditure)
)

# The stratified draw further down refers to the bare name `Stratum`, so the
# frame is attached here.
attach(FrameI)
head(FrameI)

## # A tibble: 6 x 5
## PSU Stratum Persons Income Expenditure
## <chr> <chr> <int> <dbl> <dbl>
## 1 PSU0001 idStrt001 118 70912. 44232.
## 2 PSU0002 idStrt001 136 68887. 38382.
## 3 PSU0003 idStrt001 96 37213. 19495.
## 4 PSU0004 idStrt001 88 36926. 24031.
## 5 PSU0005 idStrt001 110 57494. 31142.
## 6 PSU0006 idStrt001 116 75272. 43473.
# Per-stratum first-stage sizes: NIh PSUs in the frame, nIh = 2 PSUs to draw,
# and dI = NIh / nIh stored alongside them.
sizes <- summarise(
  group_by(FrameI, Stratum),
  NIh = n(),
  nIh = 2,
  dI = NIh / nIh
)

# The same sizes as plain vectors, one entry per stratum.
NIh <- sizes[["NIh"]]
nIh <- sizes[["nIh"]]
head(sizes)

## # A tibble: 6 x 4
## Stratum NIh nIh dI
## <chr> <int> <dbl> <dbl>
## 1 idStrt001 9 2 4.5
## 2 idStrt002 11 2 5.5
## 3 idStrt003 7 2 3.5
## 4 idStrt004 13 2 6.5
## 5 idStrt005 11 2 5.5
## 6 idStrt006 5 2 2.5
# Stage 1: draw nIh PSUs inside every stratum. The stratum labels are taken
# straight from FrameI rather than from an attach()ed copy, so the call cannot
# pick up a stale or masked `Stratum`.
samI <- S.STSI(FrameI$Stratum, NIh, nIh)

# S.STSI is expected to return row positions in the frame it was given (see the
# TeachingSampling reference), so the sampled PSU ids are read from those same
# rows instead of from a separately sorted list of factor levels.
UI <- FrameI$PSU
sampleI <- UI[samI]

# Second-stage frame: every person record of the sampled PSUs, with the stratum
# sizes and dI joined on by stratum. `%in%` never yields NA, so the logical
# mask is used directly.
FrameII <- left_join(
  sizes,
  BigCity[BigCity$PSU %in% sampleI, ],
  by = "Stratum"
)

# FrameII is not attached: the household-count and second-stage steps refer to
# it by name.
head(FrameII)

1
## # A tibble: 6 x 15
## Stratum NIh nIh dI HHID PersonID PSU Zone Sex Age MaritalST
## <chr> <int> <dbl> <dbl> <chr> <chr> <chr> <chr> <chr> <int> <fct>
## 1 idStrt~ 9 2 4.5 idHH~ idPer01 PSU0~ Rural Male 57 Married
## 2 idStrt~ 9 2 4.5 idHH~ idPer02 PSU0~ Rural Fema~ 48 Married
## 3 idStrt~ 9 2 4.5 idHH~ idPer03 PSU0~ Rural Male 20 Single
## 4 idStrt~ 9 2 4.5 idHH~ idPer04 PSU0~ Rural Fema~ 18 Single
## 5 idStrt~ 9 2 4.5 idHH~ idPer05 PSU0~ Rural Male 16 Single
## 6 idStrt~ 9 2 4.5 idHH~ idPer06 PSU0~ Rural Fema~ 0 <NA>
## # ... with 4 more variables: Income <dbl>, Expenditure <dbl>, Employment <fct>,
## # Poverty <fct>
# Number of distinct households (Ni) in each sampled PSU.
HHdb <- summarise(group_by(FrameII, PSU), Ni = n_distinct(HHID))
Ni <- as.numeric(HHdb[["Ni"]])

# Second-stage sample size: 10% of each PSU's households, rounded up.
ni <- ceiling(0.1 * Ni)

# Total number of households that will be selected.
sum(ni)

## [1] 702
# Stage 2: inside every sampled PSU, draw ni of its Ni households with S.SI and
# keep all person records of the selected households.
#
# Ni and ni follow the row order of HHdb, which may not be the order in which
# the PSUs appear in sampleI, so each PSU's sizes are looked up by PSU id
# instead of by loop position. Every PSU goes through the same code path (no
# hand-copied first iteration), an empty or single-PSU sample is handled by
# seq_along(), and the pieces are bound once at the end rather than growing
# `data` inside the loop.
clusters <- lapply(seq_along(Ni), function(i) {
  k <- match(sampleI[i], HHdb$PSU)
  clusterII <- FrameII[which(FrameII$PSU == sampleI[i]), ]
  sam <- S.SI(Ni[k], ni[k])

  # Households picked by S.SI, then all person records of those households.
  sam.HH <- data.frame(HHID = unique(clusterII$HHID)[sam])
  clusterHH <- left_join(sam.HH, clusterII, by = "HHID")

  # dki: household weight within the PSU; dk: dI times dki.
  clusterHH$dki <- Ni[k] / ni[k]
  clusterHH$dk <- clusterHH$dI * clusterHH$dki
  clusterHH
})
data <- do.call(rbind, clusters)
dim(data)

## [1] 2496 17
# Sum of the final weights over all sampled person records.
sum(data[["dk"]])

## [1] 146880.9
# Kept attached: the E.UC() call further down uses the bare name `dk`.
attach(data)

# Inputs for the estimator: the two study variables as a data frame, and the
# PSU and stratum labels as factors.
estima <- data.frame(Income = data$Income, Expenditure = data$Expenditure)
area <- as.factor(data[["PSU"]])
stratum <- as.factor(data[["Stratum"]])

# Distribution of the final weights.
hist(data$dk)

2
Histogram of data$dk
700
500
Frequency

300
100
0

0 50 100 150 200 250

data$dk
# Final weights by stratum. The formula terms are written as `data$...`, which
# is also the text that ends up on the plot axes.
boxplot(data$dk ~ data$Stratum)
250
200
150
data$dk

100
50

idStrt001 idStrt021 idStrt041 idStrt061 idStrt081 idStrt101

data$Stratum
# Weighted estimates (estimate, standard error, CVE, DEFF) for the columns of
# `estima`, using stratum and PSU as the design identifiers. The weights are
# passed as data$dk so the call does not depend on which attach()ed object or
# global happens to provide a bare `dk`.
E.UC(stratum, area, data$dk, estima)

## N Income Expenditure
## Estimation 1.468809e+05 8.290466e+07 5.427982e+07
## Standard Error 3.351918e+03 4.465049e+06 2.620232e+06
## CVE 2.282065e+00 5.385764e+00 4.827267e+00
## DEFF Inf 1.145389e+01 1.355435e+01

3
Muestreo autoponderado en dos etapas estratificado

# Reload the person-level BigCity data for the second strategy.
data("BigCity")

# First-stage frame: one row per PSU with its stratum label, its number of
# distinct households, and the PSU totals of income and expenditure.
FrameI <- summarise(
  group_by(BigCity, PSU),
  Stratum = unique(Stratum),
  Households = n_distinct(HHID),
  Income = sum(Income),
  Expenditure = sum(Expenditure)
)

# The S.STpiPS() call further down refers to the bare names `Stratum` and
# `Households`, so the frame is attached here.
attach(FrameI)
head(FrameI)

## # A tibble: 6 x 5
## PSU Stratum Households Income Expenditure
## <chr> <chr> <int> <dbl> <dbl>
## 1 PSU0001 idStrt001 26 70912. 44232.
## 2 PSU0002 idStrt001 32 68887. 38382.
## 3 PSU0003 idStrt001 24 37213. 19495.
## 4 PSU0004 idStrt001 22 36926. 24031.
## 5 PSU0005 idStrt001 28 57494. 31142.
## 6 PSU0006 idStrt001 30 75272. 43473.
# Per-stratum first-stage sizes: NIh PSUs in the frame, nIh = 2 PSUs to draw.
sizes <- summarise(group_by(FrameI, Stratum), NIh = n(), nIh = 2)

# The same sizes as plain vectors, one entry per stratum.
NIh <- sizes[["NIh"]]
nIh <- sizes[["nIh"]]
head(sizes)

## # A tibble: 6 x 3
## Stratum NIh nIh
## <chr> <int> <dbl>
## 1 idStrt001 9 2
## 2 idStrt002 11 2
## 3 idStrt003 7 2
## 4 idStrt004 13 2
## 5 idStrt005 11 2
## 6 idStrt006 5 2
# Stage 1: within each stratum draw nIh PSUs with S.STpiPS, using the number of
# households as the size measure. Both columns are taken from FrameI by name:
# by this point more than one frame with a `Stratum` column has been
# attach()ed, and a bare name would silently depend on the attach order.
resI <- S.STpiPS(FrameI$Stratum, FrameI$Households, nIh)
head(resI)

## [,1] [,2]
## [1,] 4 0.1774194
## [2,] 6 0.2419355
## [3,] 12 0.1717791
## [4,] 20 0.1717791
## [5,] 23 0.2553191
## [6,] 26 0.2978723
# Column 1 of resI is used as the selected frame rows and column 2 as their
# inclusion probabilities (dI below is its reciprocal).
samI <- resI[, 1]
piI <- resI[, 2]

# Read the sampled PSU ids from the frame rows themselves rather than from a
# separately sorted list of factor levels.
UI <- FrameI$PSU
sampleI <- data.frame(PSU = UI[samI], dI = 1 / piI)

# Second-stage frame: every person record of the sampled PSUs with dI attached.
# The join key is spelled out (PSU is the only column the two tables share),
# and the PSU column is addressed by name instead of by position.
FrameII <- left_join(
  sampleI,
  BigCity[BigCity$PSU %in% sampleI$PSU, ],
  by = "PSU"
)

# FrameII is not attached: the household-count and second-stage steps refer to
# it by name.
head(FrameII)

4
## PSU dI HHID PersonID Stratum Zone Sex Age MaritalST
## 1 PSU0004 5.636364 idHH00042 idPer01 idStrt001 Rural Male 57 Married
## 2 PSU0004 5.636364 idHH00042 idPer02 idStrt001 Rural Female 48 Married
## 3 PSU0004 5.636364 idHH00042 idPer03 idStrt001 Rural Male 20 Single
## 4 PSU0004 5.636364 idHH00042 idPer04 idStrt001 Rural Female 18 Single
## 5 PSU0004 5.636364 idHH00042 idPer05 idStrt001 Rural Male 16 Single
## 6 PSU0004 5.636364 idHH00042 idPer06 idStrt001 Rural Female 0 <NA>
## Income Expenditure Employment Poverty
## 1 527.84 309.09 Inactive NotPoor
## 2 527.84 309.09 Inactive NotPoor
## 3 527.84 309.09 Employed NotPoor
## 4 527.84 309.09 Inactive NotPoor
## 5 527.84 309.09 Inactive NotPoor
## 6 527.84 309.09 <NA> NotPoor
# Fixed second-stage sample size: households drawn in every sampled PSU.
# Defined once so the value recorded in HHdb is the value the sampling steps
# actually use (previously HHdb stored 5 while 3 was used).
ni <- 3

# Number of distinct households (Ni) in each sampled PSU, plus the common ni.
HHdb <- FrameII %>%
  group_by(PSU) %>%
  summarise(Ni = length(unique(HHID)))
HHdb$ni <- ni

Ni <- as.numeric(HHdb$Ni)
head(HHdb)

## # A tibble: 6 x 3
## PSU Ni ni
## <chr> <int> <dbl>
## 1 PSU0004 22 5
## 2 PSU0006 30 5
## 3 PSU0012 28 5
## 4 PSU0020 28 5
## 5 PSU0023 24 5
## 6 PSU0026 28 5
# Stage 2 for the first sampled PSU: draw ni of its households with S.SI and
# keep all person records of the selected households.
#
# Ni follows the row order of HHdb, which may not be the order of
# sampleI$PSU, so this PSU's household count is looked up by PSU id rather
# than assumed to sit in position 1.
first_psu <- sampleI$PSU[1]
first_pos <- match(first_psu, HHdb$PSU)

sam <- S.SI(Ni[first_pos], ni)
clusterII <- FrameII[which(FrameII$PSU == first_psu), ]
sam.HH <- data.frame(HHID = unique(clusterII$HHID)[sam])
clusterHH <- left_join(sam.HH, clusterII, by = "HHID")

# dki: household weight within the PSU; dk: dI times dki.
clusterHH$dki <- Ni[first_pos] / ni
clusterHH$dk <- clusterHH$dI * clusterHH$dki
data <- clusterHH
head(data)

## HHID PSU dI PersonID Stratum Zone Sex Age MaritalST

## 1 idHH00050 PSU0004 5.636364 idPer01 idStrt001 Rural Female 41 Separated
## 2 idHH00050 PSU0004 5.636364 idPer02 idStrt001 Rural Male 19 Single
## 3 idHH00050 PSU0004 5.636364 idPer03 idStrt001 Rural Female 16 Single
## 4 idHH20687 PSU0004 5.636364 idPer01 idStrt001 Rural Male 57 Married
## 5 idHH20687 PSU0004 5.636364 idPer02 idStrt001 Rural Female 48 Married
## 6 idHH20687 PSU0004 5.636364 idPer03 idStrt001 Rural Male 20 Single
## Income Expenditure Employment Poverty dki dk
## 1 503.92 331.92 Employed NotPoor 7.333333 41.33333
## 2 503.92 331.92 Inactive NotPoor 7.333333 41.33333
## 3 503.92 331.92 Inactive NotPoor 7.333333 41.33333
## 4 527.84 309.09 Inactive NotPoor 7.333333 41.33333
## 5 527.84 309.09 Inactive NotPoor 7.333333 41.33333
## 6 527.84 309.09 Employed NotPoor 7.333333 41.33333

5
# Stage 2 for the remaining sampled PSUs, appended to the first PSU's records
# already held in `data`.
#
# Each PSU's household count is looked up by PSU id (Ni follows HHdb's row
# order, which may differ from the order of sampleI$PSU). seq_along(Ni)[-1] is
# empty when only one PSU was sampled, where 2:length(Ni) would count
# backwards, and the pieces are bound in one call instead of growing `data` on
# every pass.
remaining <- lapply(seq_along(Ni)[-1], function(i) {
  k <- match(sampleI$PSU[i], HHdb$PSU)
  clusterII <- FrameII[which(FrameII$PSU == sampleI$PSU[i]), ]
  sam <- S.SI(Ni[k], ni)

  # Households picked by S.SI, then all person records of those households.
  sam.HH <- data.frame(HHID = unique(clusterII$HHID)[sam])
  clusterHH <- left_join(sam.HH, clusterII, by = "HHID")

  # dki: household weight within the PSU; dk: dI times dki.
  clusterHH$dki <- Ni[k] / ni
  clusterHH$dk <- clusterHH$dI * clusterHH$dki
  clusterHH
})
data <- do.call(rbind, c(list(data), remaining))

# Sum of the final weights over all sampled person records.
sum(data$dk)

## [1] 148253
# Rows (person records) and columns of the final sample.
dim(data)

## [1] 2585 15
# Kept attached: the E.UC() call further down uses the bare name `dk`.
attach(data)

# Inputs for the estimator: the two study variables as a data frame, and the
# PSU and stratum labels as factors.
estima <- data.frame(Income = data$Income, Expenditure = data$Expenditure)
area <- as.factor(data[["PSU"]])
stratum <- as.factor(data[["Stratum"]])

# Distribution of the final weights.
hist(data$dk)

Histogram of data$dk
800
600
Frequency

400
200
0

0 50 100 150 200 250

data$dk
# Final weights by stratum. The formula terms are written as `data$...`, which
# is also the text that ends up on the plot axes.
boxplot(data$dk ~ data$Stratum)

6
250
200
150
data$dk

100
50

idStrt001 idStrt021 idStrt041 idStrt061 idStrt081 idStrt101

data$Stratum
# Weighted estimates (estimate, standard error, CVE, DEFF) for the columns of
# `estima`, using stratum and PSU as the design identifiers. The weights are
# passed as data$dk: more than one object with a `dk` column has been
# attach()ed by this point, so a bare `dk` would depend on the attach order.
E.UC(stratum, area, data$dk, estima)

## N Income Expenditure
## Estimation 1.482530e+05 8.382537e+07 5.363328e+07
## Standard Error 4.056097e+03 4.551031e+06 2.262998e+06
## CVE 2.735929e+00 5.429181e+00 4.219391e+00
## DEFF Inf 7.373944e+00 7.260026e+00

Business Report Data Mining
91% (11)
Business Report Data Mining
18 pages
Answer#1: Scope of Cost Accounting:: Solve The Following Questions and Submit Your Assignment On/or Before April 15
100% (2)
Answer#1: Scope of Cost Accounting:: Solve The Following Questions and Submit Your Assignment On/or Before April 15
7 pages
Sap Product Costing Configuration Document
75% (4)
Sap Product Costing Configuration Document
16 pages
Econ 104 Proj 3
100% (1)
Econ 104 Proj 3
25 pages
Chart Patterns
100% (2)
Chart Patterns
10 pages
Etapas Script
No ratings yet
Etapas Script
6 pages
Talk 4
No ratings yet
Talk 4
35 pages
Ca09 Pitblado Handout
No ratings yet
Ca09 Pitblado Handout
28 pages
unit 3 part 2
No ratings yet
unit 3 part 2
40 pages
slidesc53_2
No ratings yet
slidesc53_2
41 pages
Cheat Sheet: Optimal Stratification
No ratings yet
Cheat Sheet: Optimal Stratification
2 pages
MIS410 Lecture1toLecture7
No ratings yet
MIS410 Lecture1toLecture7
74 pages
LR 2 Sampling
No ratings yet
LR 2 Sampling
27 pages
analysis of household survey
No ratings yet
analysis of household survey
6 pages
Socio-Economc Factors and IQ Analysis: Mawadda Hassan 2024-06-22
No ratings yet
Socio-Economc Factors and IQ Analysis: Mawadda Hassan 2024-06-22
17 pages
Lec. Note E5
No ratings yet
Lec. Note E5
7 pages
Taller Nº2 1
No ratings yet
Taller Nº2 1
16 pages
REPORT 2
No ratings yet
REPORT 2
15 pages
MIS410 Lecture1toLecture5
No ratings yet
MIS410 Lecture1toLecture5
66 pages
Times University Ranks DataSet Analysis
No ratings yet
Times University Ranks DataSet Analysis
19 pages
Lecture 5 Stratified Sampling
No ratings yet
Lecture 5 Stratified Sampling
14 pages
Decision Tree and KNN Assignment Two
No ratings yet
Decision Tree and KNN Assignment Two
13 pages
Analysis of Multiple Informant/ Multiple Source Data in Stata
No ratings yet
Analysis of Multiple Informant/ Multiple Source Data in Stata
38 pages
Socio-Economical Status of India Using Machine Learning Algorithms
No ratings yet
Socio-Economical Status of India Using Machine Learning Algorithms
10 pages
Test Bank For Interactive Statistics 3 e 3rd Edition 0131497561
100% (59)
Test Bank For Interactive Statistics 3 e 3rd Edition 0131497561
4 pages
Data Mining
100% (1)
Data Mining
6 pages
PA Univariate R Solution
No ratings yet
PA Univariate R Solution
6 pages
ML - Unit-6 KMeans
No ratings yet
ML - Unit-6 KMeans
20 pages
Sampling using R
No ratings yet
Sampling using R
3 pages
Mock Exam - Appendix
No ratings yet
Mock Exam - Appendix
15 pages
Chapter 4 - 2010
No ratings yet
Chapter 4 - 2010
13 pages
iMS_HW4_Ignoring_Dependence
No ratings yet
iMS_HW4_Ignoring_Dependence
6 pages
Stratified Randon Sampling
No ratings yet
Stratified Randon Sampling
32 pages
Lecture-9 Cluster Analysis_LAK
No ratings yet
Lecture-9 Cluster Analysis_LAK
4 pages
Stratified
No ratings yet
Stratified
17 pages
Journal of The American Statistical Association
No ratings yet
Journal of The American Statistical Association
16 pages
DMBI
No ratings yet
DMBI
16 pages
Review 2 - Full Paper - Nurul Istiqamah
No ratings yet
Review 2 - Full Paper - Nurul Istiqamah
10 pages
12
No ratings yet
12
26 pages
Survey Data Analysis in Stata: Jeff Pitblado
No ratings yet
Survey Data Analysis in Stata: Jeff Pitblado
47 pages
Introduction To Statistics - 19!3!21
No ratings yet
Introduction To Statistics - 19!3!21
47 pages
SAMPLING METHODS Group 2
No ratings yet
SAMPLING METHODS Group 2
3 pages
Since R Considers All Variables As Numeric, We Convert Them Into Factors
No ratings yet
Since R Considers All Variables As Numeric, We Convert Them Into Factors
3 pages
Stat 475 Notes 8: y B X y B X y BX N SEB NNX N X Is Unknown, Then We Substitute The Sample Mean X For It
No ratings yet
Stat 475 Notes 8: y B X y B X y BX N SEB NNX N X Is Unknown, Then We Substitute The Sample Mean X For It
13 pages
Cluster Ana
No ratings yet
Cluster Ana
12 pages
stata应用课程作图
No ratings yet
stata应用课程作图
33 pages
Introduction (Basic Definitions and Concepts) A: Population
No ratings yet
Introduction (Basic Definitions and Concepts) A: Population
8 pages
Data Wrangling
No ratings yet
Data Wrangling
12 pages
Produit Bancaire
No ratings yet
Produit Bancaire
15 pages
Data Mining Business Report 2
No ratings yet
Data Mining Business Report 2
18 pages
Survey Wss 2010
No ratings yet
Survey Wss 2010
134 pages
Introduction To Statistics - 23 - 8 - 2023
No ratings yet
Introduction To Statistics - 23 - 8 - 2023
41 pages
Software For Data Analysis and Its Applications For The Distance Courses of "PROMETHEUS"
No ratings yet
Software For Data Analysis and Its Applications For The Distance Courses of "PROMETHEUS"
29 pages
1 Pengantar Statistika
No ratings yet
1 Pengantar Statistika
22 pages
IAT Paper Jan-June 22 DMBI DIV A&B Solution
No ratings yet
IAT Paper Jan-June 22 DMBI DIV A&B Solution
10 pages
Small Area Estimation Methods, Applications and Practical Demonstration
No ratings yet
Small Area Estimation Methods, Applications and Practical Demonstration
56 pages
Tutorial Worksheet #2
No ratings yet
Tutorial Worksheet #2
2 pages
Random Sampling (Stratified) Example
No ratings yet
Random Sampling (Stratified) Example
4 pages
Part 1b
No ratings yet
Part 1b
7 pages
STA 405 FIRST MATERIAL
No ratings yet
STA 405 FIRST MATERIAL
17 pages
04 Stratified Sampling
No ratings yet
04 Stratified Sampling
19 pages
150+ C Pattern Programs
From Everand
150+ C Pattern Programs
Hernando Abella
No ratings yet
No Ph.D. Game Design With Three.js
From Everand
No Ph.D. Game Design With Three.js
Nikiforos Kontopoulos
No ratings yet
INTERNATIONAL FINANCE THEORY AND PRACTICE
No ratings yet
INTERNATIONAL FINANCE THEORY AND PRACTICE
3 pages
Contents of A Project Report
No ratings yet
Contents of A Project Report
4 pages
X SS Pre Board 1 2020 21
No ratings yet
X SS Pre Board 1 2020 21
13 pages
Job Description :financial AR & AP Associate
No ratings yet
Job Description :financial AR & AP Associate
2 pages
Customer Service Representative
No ratings yet
Customer Service Representative
1 page
INTD 200 - Quiz#2
No ratings yet
INTD 200 - Quiz#2
1 page
Car Lease Policy
No ratings yet
Car Lease Policy
2 pages
Asset Management: A Best Practices Guide: Purpose
No ratings yet
Asset Management: A Best Practices Guide: Purpose
4 pages
Genpact: Intelligent Enterprises Powered by Process
No ratings yet
Genpact: Intelligent Enterprises Powered by Process
11 pages
Final Brief
No ratings yet
Final Brief
2 pages
City Regions in India
100% (1)
City Regions in India
4 pages
E Marketing Function
75% (4)
E Marketing Function
10 pages
MSBP - Assignment Brief - V1.1 - Approved - 20240314
No ratings yet
MSBP - Assignment Brief - V1.1 - Approved - 20240314
15 pages
Total Outside Liability Total Liabilities: Bal-Cma
No ratings yet
Total Outside Liability Total Liabilities: Bal-Cma
4 pages
Material Costing
No ratings yet
Material Costing
21 pages
VAT Works Contracts
No ratings yet
VAT Works Contracts
149 pages
IT, ITES and Analytics
No ratings yet
IT, ITES and Analytics
70 pages
Chapter 1
No ratings yet
Chapter 1
33 pages
Industrialization During COLONIAL
No ratings yet
Industrialization During COLONIAL
8 pages
Disaster Risk Reduction AND MANAGEMENT
No ratings yet
Disaster Risk Reduction AND MANAGEMENT
21 pages
Modern Foods Industries Limited: A Case Study: Nandita Markandan & H B Soumya
No ratings yet
Modern Foods Industries Limited: A Case Study: Nandita Markandan & H B Soumya
5 pages
【Brochure】Sinoteam Logistics Co.,Ltd - China
No ratings yet
【Brochure】Sinoteam Logistics Co.,Ltd - China
9 pages
Technology Assessment Framework
No ratings yet
Technology Assessment Framework
8 pages
Nike SWOT Analy
No ratings yet
Nike SWOT Analy
11 pages
Book 4 Portfolio Management
No ratings yet
Book 4 Portfolio Management
254 pages
Marketing Assignment 1
No ratings yet
Marketing Assignment 1
3 pages
DT-UNIT-3-SLIDES_merged
No ratings yet
DT-UNIT-3-SLIDES_merged
95 pages

Transversales Script

Uploaded by

Transversales Script

Uploaded by

Estrategias transversales

Muestreo en dos etapas estratificado

0 50 100 150 200 250

idStrt001 idStrt021 idStrt041 idStrt061 idStrt081 idStrt101

## HHID PSU dI PersonID Stratum Zone Sex Age MaritalST

0 50 100 150 200 250

idStrt001 idStrt021 idStrt041 idStrt061 idStrt081 idStrt101

You might also like