-
Notifications
You must be signed in to change notification settings - Fork 1
/
medical.tex
163 lines (139 loc) · 5.58 KB
/
medical.tex
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
%%%
% Tech report template. Compile with pdflatex.
%%%
% Alternative document class (report) kept for reference; the body contains
% a matching commented-out \chapter example.
%\documentclass[pdftext,twoside,12pt]{report}
% NOTE(review): `pdftext' does not look like a standard article-class option;
% confirm it is intended.
\documentclass[pdftext,twoside,11pt]{article}
% Page layout: A4 paper with asymmetric left/right margins; header and footer
% are counted as part of the text body (includehead, includefoot).
\usepackage[a4paper,lmargin=2.5cm,rmargin=2cm,tmargin=1cm,bmargin=1cm,includehead,includefoot]{geometry}
% Language support: german and english are loaded; babel treats the last
% listed language (english) as the main one.
\usepackage[german,english]{babel}
\usepackage{url}
\usepackage{subfig}
\usepackage{fancyhdr}
\usepackage{caption}
\usepackage{array}
\usepackage{amsmath} % needed for subequations
\usepackage{amssymb}
\usepackage{marvosym} % for the Euro symbol
% Font selection: mathptmx, helvet (scaled to 90%) and times are all loaded.
% NOTE(review): times is loaded after mathptmx and helvet; the order may
% matter for the resulting text fonts, so do not reorder without checking.
\usepackage{mathptmx}
\usepackage{multirow}
\usepackage[small,compact]{titlesec} % for compressed section titles
\usepackage{mdwlist} % for compressed itemized lists
\usepackage{setspace} % for changing spacing in environments (see biblio)
% Numeric citations, sorted and compressed.
\usepackage[numbers,sort&compress]{natbib}
\usepackage[scaled=.90]{helvet}
\usepackage{times}
\usepackage[T1]{fontenc}
% Input encoding: the source is UTF-8; the latin1 alternative is disabled.
%\usepackage[latin1]{inputenc}
\usepackage[utf8]{inputenc}
\usepackage{graphicx}
\usepackage{pgf}
% NOTE(review): hypernat is reportedly unnecessary with current natbib and
% hyperref; confirm before removing. It is loaded before hyperref here.
\usepackage{hypernat}
% hyperref is loaded last; it is configured in the \hypersetup call that follows.
\usepackage{hyperref}
%%% Package options %%%
% hyperref: coloured (blue) links of every kind and empty PDF metadata fields.
% NOTE(review): pagebackref is usually given as a hyperref load-time option;
% confirm it has any effect when set through \hypersetup.
\hypersetup{%
  colorlinks=true,
  breaklinks=true,
  pagebackref=true,
  urlcolor=blue,
  linkcolor=blue,
  anchorcolor=blue,
  citecolor=blue,
  pdfpagemode=UseNone, % alternatives: FullScreen, UseThumbs, UseOutlines
  pdfauthor={},
  pdftitle={},
  pdfsubject={},
  pdfkeywords={}%
}
% Graphics: figures are looked up in img/ and the current directory, trying
% the listed extensions.
\graphicspath{{img/} {./}}
\DeclareGraphicsExtensions{.jpg,.pdf,.mps,.png}
% URLs are set in the roman font instead of typewriter.
\urlstyle{rm}
% Captions: small sans-serif text.
\renewcommand{\captionfont}{\small \sffamily}
% Optional: smaller font in the bibliography.
%\newcommand{\bibfont}{\scriptsize}
% Float placement: allow up to 50 floats per page / top area / bottom area and
% let floats fill up to 90% of a page, leaving at least 10% for text.
\setcounter{topnumber}{50}
\setcounter{bottomnumber}{50}
\setcounter{totalnumber}{50}
\renewcommand{\topfraction}{.9}
\renewcommand{\bottomfraction}{.9}
\renewcommand{\textfraction}{.1}
\renewcommand{\floatpagefraction}{.9}
% Compressed vertical spacing: bibliography entries and list parameters.
\setlength{\bibsep}{1pt}
\setlength{\partopsep}{0pt}
\setlength{\topsep}{0pt}
\setlength{\itemsep}{0pt}
% Example: declare an image once (stored once in the PDF, which keeps the
% file small) ...
%\pgfdeclareimage[height=0.8cm]{logo}{img/logo}
% ... and place it wherever needed with:
%\pgfuseimage{logo}
% Headers and Footers
% Use fancyhdr's page style and start from empty header/footer fields.
\pagestyle{fancy}
\fancyhead{} % reset headers
\fancyfoot{} % reset footers
% Header fields; the `O' selector restricts each field to odd pages.
% NOTE(review): the class is loaded with twoside, so even pages get no
% header text, and no footer field is set -- confirm that is intended.
\fancyhead[LO]{\textsf{\textbf{TITLE}}}
% Print the current date. \date{...} only stores the date for \maketitle and
% typesets nothing, so \today is used directly here.
\fancyhead[CO]{\today}
\fancyhead[RO]{AUTHOR}
% remove horizontal lines between text and headers and footers
\renewcommand{\footrulewidth}{0pt}
\renewcommand{\headrulewidth}{0pt}
% Title-page metadata, typeset by the \maketitle call in the document body.
\date{\today}
\author{%
  AUTHOR\\
  University of Florida\\
}
\title{A Review of Recent Research in Extracting Information
  From Medical Textual Documents}
\begin{document}
%\thispagestyle{empty}
\maketitle
% keywords
% Use with {report} documentclass
% \chapter{The beginning}
% \label{cha:beginning}
%----------------------------------------------------------%
\section{Automated identification of extreme-risk events in clinical incident reports}
\label{sec:intro}
\begin{itemize}
\item Objectives: classification problem.
\item Methods: Naive Bayes and Support Vector Machine (SVM).
\item Result assessment: precision, recall, F-measure, AUC.
\item Feature extraction: punctuation removed, text converted to lower case, `bag of words' representation.
\item Input representation: binary, term frequency, thresholding, tf-idf.
\item Feature selection: excluding words with similar frequency (dimensionality reduction);
excluding determiners, prepositions, pronouns, and conjunctions (POS tagging);
stemming; bigrams.
\item Training and validating the classifiers: Naive Bayes, SVM (linear, polynomial, RBF), 10-fold cross-validation.
\end{itemize}
\section{Extracting Information from Textual Documents
in the Electronic Health Record: A Review of Recent Research}
\label{sec:ehr-review}
\begin{itemize}
\item Spell checking, word sense disambiguation (?), POS tagging, and contextual features such as negation, temporality, and subject identification.
\item Automatic de-identification uses the extraction of personal information before its removal. Rule-based NER.
\item Contextual feature detection and analysis:
negation (e.g.\ ``denies any chest pain''), temporality (e.g.\ ``fracture of the tibia 2 years ago''), and event subject identification (e.g.\ ``his mother has diabetes'').
NegExpander, NegEx, and Negfinder are programs that detect negation terms;
TimeText detects temporal relations.
\end{itemize}
\section{UMLS project}
\label{sec:umls}
\begin{itemize}
\item The UMLS project is an effort to overcome two significant
barriers to effective retrieval of machine-readable information.
\item The first is the variety of ways the same concepts are expressed
in different machine-readable sources and by different people.
\item The second is the distribution of useful information among many disparate databases and systems.
\end{itemize}
\section{Automated systems to identify relevant
documents in product risk management}
\label{sec:risk-documents}
\begin{itemize}
\item Logistic regression, k-nearest neighbour, Naive Bayes, SVM.
\item Word occurrence, binary frequency, TF-IDF.
\item Stemming, removing prepositions, identifying acronyms, synonyms obtained from Omniviz.
\end{itemize}
\section{De-Identification}
\label{sec:deid}
\begin{itemize}
\item Patient's and doctor's first and last names
\item ID numbers; phone, fax, and pager numbers; hospital names; geographic locations; dates; ages above 90
\end{itemize}
Features of the text used in de-identification:
\begin{itemize}
\item Target word to be classified
\item Words up to 2 words left/right of target
\item Target part of speech
\item Target capitalization
\item Target length and others.
\end{itemize}
%----------------------------------------------------------%
\end{document}