Converted to AsciiDoc
This commit is contained in:
parent
ada1aca49b
commit
e836ecfd7c
45 changed files with 0 additions and 21077 deletions
|
@ -1,3 +0,0 @@
|
|||
This directory contains Relax NG Compact schema files, for use with
|
||||
Emacs. These files were download from http://www.docbook.org/rng/4.5/
|
||||
on 2012-07-16.
|
|
@ -1,164 +0,0 @@
|
|||
# ......................................................................
|
||||
|
||||
# DocBook CALS Table Model V4.5 ........................................
|
||||
|
||||
# File calstblx.mod ....................................................
|
||||
|
||||
# Copyright 1992-2002 HaL Computer Systems, Inc.,
|
||||
# O'Reilly & Associates, Inc., ArborText, Inc., Fujitsu Software
|
||||
# Corporation, Norman Walsh, Sun Microsystems, Inc., and the
|
||||
# Organization for the Advancement of Structured Information
|
||||
# Standards (OASIS).
|
||||
#
|
||||
# This DTD is based on the CALS Table Model
|
||||
# PUBLIC "-//USA-DOD//DTD Table Model 951010//EN"
|
||||
#
|
||||
# $Id: calstblx.dtd 6340 2006-10-03 13:23:24Z nwalsh $
|
||||
#
|
||||
# Permission to use, copy, modify and distribute the DocBook DTD
|
||||
# and its accompanying documentation for any purpose and without fee
|
||||
# is hereby granted in perpetuity, provided that the above copyright
|
||||
# notice and this paragraph appear in all copies. The copyright
|
||||
# holders make no representation about the suitability of the DTD for
|
||||
# any purpose. It is provided "as is" without expressed or implied
|
||||
# warranty.
|
||||
#
|
||||
# If you modify the DocBook DTD in any way, except for declaring and
|
||||
# referencing additional sets of general entities and declaring
|
||||
# additional notations, label your DTD as a variant of DocBook. See
|
||||
# the maintenance documentation for more information.
|
||||
#
|
||||
# Please direct all questions, bug reports, or suggestions for
|
||||
# changes to the docbook@lists.oasis-open.org mailing list. For more
|
||||
# information, see http://www.oasis-open.org/docbook/.
|
||||
|
||||
# ......................................................................
|
||||
|
||||
# This module contains the definitions for the CALS Table Model
|
||||
# converted to XML. It has been modified slightly for use in the
|
||||
# combined HTML/CALS models supported by DocBook V4.5.
|
||||
|
||||
# These definitions are not directly related to the table model, but are
|
||||
# used in the default CALS table model and are usually defined elsewhere
|
||||
# (and prior to the inclusion of this table module) in a CALS DTD.
|
||||
|
||||
# no if zero(s),
|
||||
# yes if any other digits value
|
||||
|
||||
yesorno = string
|
||||
titles = title?
|
||||
# default for use in entry content
|
||||
|
||||
# The parameter entities as defined below provide the CALS table model
|
||||
# as published (as part of the Example DTD) in MIL-HDBK-28001.
|
||||
#
|
||||
# These following declarations provide the CALS-compliant default definitions
|
||||
# for these entities. However, these entities can and should be redefined
|
||||
# (by giving the appropriate parameter entity declaration(s) prior to the
|
||||
# reference to this Table Model declaration set entity) to fit the needs
|
||||
# of the current application.
|
||||
tbl.table-titles.mdl = titles
|
||||
tbl.table-main.mdl = tgroup+ | graphic+
|
||||
tbl.tgroup.mdl = colspec*, spanspec*, thead?, tfoot?, tbody
|
||||
tbl.tgroup.att = attribute tgroupstyle { text }?
|
||||
tbl.row.mdl = (entry | entrytbl)+
|
||||
tbl.entrytbl.mdl = colspec*, spanspec*, thead?, tbody
|
||||
# ===== Element and attribute declarations follow. =====
|
||||
|
||||
# doc:A formal table in a document.
|
||||
table = element table { table.attlist, tbl.table.mdl }
|
||||
table.attlist &=
|
||||
attribute frame { tbl.frame.attval }?,
|
||||
attribute colsep { yesorno }?,
|
||||
attribute rowsep { yesorno }?,
|
||||
tbl.table.att,
|
||||
bodyatt,
|
||||
secur
|
||||
# doc:A wrapper for the main content of a table, or part of a table.
|
||||
tgroup = element tgroup { tgroup.attlist, tbl.tgroup.mdl }
|
||||
tgroup.attlist &=
|
||||
attribute cols { text },
|
||||
tbl.tgroup.att,
|
||||
attribute colsep { yesorno }?,
|
||||
attribute rowsep { yesorno }?,
|
||||
attribute align { "left" | "right" | "center" | "justify" | "char" }?,
|
||||
attribute char { text }?,
|
||||
attribute charoff { text }?,
|
||||
secur
|
||||
# doc:Specifications for a column in a table.
|
||||
colspec = element colspec { colspec.attlist, empty }
|
||||
colspec.attlist &=
|
||||
attribute colnum { text }?,
|
||||
attribute colname { text }?,
|
||||
attribute colwidth { text }?,
|
||||
attribute colsep { yesorno }?,
|
||||
attribute rowsep { yesorno }?,
|
||||
attribute align { "left" | "right" | "center" | "justify" | "char" }?,
|
||||
attribute char { text }?,
|
||||
attribute charoff { text }?
|
||||
# doc:Formatting information for a spanned column in a table.
|
||||
spanspec = element spanspec { spanspec.attlist, empty }
|
||||
spanspec.attlist &=
|
||||
attribute namest { text },
|
||||
attribute nameend { text },
|
||||
attribute spanname { text },
|
||||
attribute colsep { yesorno }?,
|
||||
attribute rowsep { yesorno }?,
|
||||
attribute align { "left" | "right" | "center" | "justify" | "char" }?,
|
||||
attribute char { text }?,
|
||||
attribute charoff { text }?
|
||||
# doc:A table header consisting of one or more rows.
|
||||
thead = element thead { thead.attlist, tbl.hdft.mdl }
|
||||
thead.attlist &=
|
||||
attribute valign { "top" | "middle" | "bottom" }?,
|
||||
secur
|
||||
# doc:A table footer consisting of one or more rows.
|
||||
tfoot = element tfoot { tfoot.attlist, tbl.hdft.mdl }
|
||||
tfoot.attlist &=
|
||||
attribute valign { "top" | "middle" | "bottom" }?,
|
||||
secur
|
||||
# doc:A wrapper for the rows of a table or informal table.
|
||||
tbody = element tbody { tbody.attlist, tbl.tbody.mdl }
|
||||
tbody.attlist &=
|
||||
attribute valign { "top" | "middle" | "bottom" }?,
|
||||
secur
|
||||
# doc:A row in a table.
|
||||
row = element row { row.attlist, tbl.row.mdl }
|
||||
row.attlist &=
|
||||
attribute rowsep { yesorno }?,
|
||||
attribute valign { "top" | "middle" | "bottom" }?,
|
||||
secur
|
||||
# doc:A subtable appearing in place of an Entry in a table.
|
||||
entrytbl = element entrytbl { entrytbl.attlist, tbl.entrytbl.mdl }
|
||||
entrytbl.attlist &=
|
||||
attribute cols { text },
|
||||
tbl.tgroup.att,
|
||||
attribute colname { text }?,
|
||||
attribute spanname { text }?,
|
||||
attribute namest { text }?,
|
||||
attribute nameend { text }?,
|
||||
attribute colsep { yesorno }?,
|
||||
attribute rowsep { yesorno }?,
|
||||
attribute align { "left" | "right" | "center" | "justify" | "char" }?,
|
||||
attribute char { text }?,
|
||||
attribute charoff { text }?,
|
||||
secur
|
||||
# doc:A cell in a table.
|
||||
entry = element entry { entry.attlist, tbl.entry.mdl* }
|
||||
entry.attlist &=
|
||||
attribute colname { text }?,
|
||||
attribute namest { text }?,
|
||||
attribute nameend { text }?,
|
||||
attribute spanname { text }?,
|
||||
attribute morerows { text }?,
|
||||
attribute colsep { yesorno }?,
|
||||
attribute rowsep { yesorno }?,
|
||||
attribute align { "left" | "right" | "center" | "justify" | "char" }?,
|
||||
attribute char { text }?,
|
||||
attribute charoff { text }?,
|
||||
attribute rotate { yesorno }?,
|
||||
attribute valign { "top" | "middle" | "bottom" }?,
|
||||
secur
|
||||
# End of DocBook CALS Table Model V4.5 .................................
|
||||
|
||||
# ......................................................................
|
File diff suppressed because it is too large
Load diff
|
@ -1,85 +0,0 @@
|
|||
# ......................................................................
|
||||
|
||||
# DocBook notations module V4.5 ........................................
|
||||
|
||||
# File dbnotnx.mod .....................................................
|
||||
|
||||
# Copyright 1992-2004 HaL Computer Systems, Inc.,
|
||||
# O'Reilly & Associates, Inc., ArborText, Inc., Fujitsu Software
|
||||
# Corporation, Norman Walsh, Sun Microsystems, Inc., and the
|
||||
# Organization for the Advancement of Structured Information
|
||||
# Standards (OASIS).
|
||||
#
|
||||
# $Id: dbnotnx.mod 6340 2006-10-03 13:23:24Z nwalsh $
|
||||
#
|
||||
# Permission to use, copy, modify and distribute the DocBook DTD
|
||||
# and its accompanying documentation for any purpose and without fee
|
||||
# is hereby granted in perpetuity, provided that the above copyright
|
||||
# notice and this paragraph appear in all copies. The copyright
|
||||
# holders make no representation about the suitability of the DTD for
|
||||
# any purpose. It is provided "as is" without expressed or implied
|
||||
# warranty.
|
||||
#
|
||||
# If you modify the DocBook DTD in any way, except for declaring and
|
||||
# referencing additional sets of general entities and declaring
|
||||
# additional notations, label your DTD as a variant of DocBook. See
|
||||
# the maintenance documentation for more information.
|
||||
#
|
||||
# Please direct all questions, bug reports, or suggestions for
|
||||
# changes to the docbook@lists.oasis-open.org mailing list. For more
|
||||
# information, see http://www.oasis-open.org/docbook/.
|
||||
|
||||
# ......................................................................
|
||||
|
||||
# This module contains the notation declarations used by DocBook.
|
||||
#
|
||||
# In DTD driver files referring to this module, please use an entity
|
||||
# declaration that uses the public identifier shown below:
|
||||
#
|
||||
# <!ENTITY % dbnotn PUBLIC
|
||||
# "-//OASIS//ENTITIES DocBook Notations V4.5//EN"
|
||||
# "dbnotnx.mod">
|
||||
# %dbnotn;
|
||||
#
|
||||
# See the documentation for detailed information on the parameter
|
||||
# entity and module scheme used in DocBook, customizing DocBook and
|
||||
# planning for interchange, and changes made since the last release
|
||||
# of DocBook.
|
||||
|
||||
local.notation.class = notAllowed
|
||||
notation.class =
|
||||
"BMP"
|
||||
| "CGM-CHAR"
|
||||
| "CGM-BINARY"
|
||||
| "CGM-CLEAR"
|
||||
| "DITROFF"
|
||||
| "DVI"
|
||||
| "EPS"
|
||||
| "EQN"
|
||||
| "FAX"
|
||||
| "GIF"
|
||||
| "GIF87a"
|
||||
| "GIF89a"
|
||||
| "JPG"
|
||||
| "JPEG"
|
||||
| "IGES"
|
||||
| "PCX"
|
||||
| "PIC"
|
||||
| "PNG"
|
||||
| "PS"
|
||||
| "SGML"
|
||||
| "TBL"
|
||||
| "TEX"
|
||||
| "TIFF"
|
||||
| "WMF"
|
||||
| "WPG"
|
||||
| "SVG"
|
||||
| "PDF"
|
||||
| "SWF"
|
||||
| "linespecific"
|
||||
| local.notation.class
|
||||
# WordPerfect Graphic format
|
||||
|
||||
# End of DocBook notations module V4.5 .................................
|
||||
|
||||
# ......................................................................
|
File diff suppressed because it is too large
Load diff
|
@ -1,499 +0,0 @@
|
|||
# ......................................................................
|
||||
|
||||
# DocBook XML DTD V4.5 .................................................
|
||||
|
||||
# File docbookx.dtd ....................................................
|
||||
|
||||
# Copyright 1992-2006 HaL Computer Systems, Inc.,
|
||||
# O'Reilly & Associates, Inc., ArborText, Inc., Fujitsu Software
|
||||
# Corporation, Norman Walsh, Sun Microsystems, Inc., and the
|
||||
# Organization for the Advancement of Structured Information
|
||||
# Standards (OASIS).
|
||||
#
|
||||
# See also http://docbook.org/specs/
|
||||
#
|
||||
# $Id: docbookx.dtd 6340 2006-10-03 13:23:24Z nwalsh $
|
||||
#
|
||||
# Permission to use, copy, modify and distribute the DocBook XML DTD
|
||||
# and its accompanying documentation for any purpose and without fee
|
||||
# is hereby granted in perpetuity, provided that the above copyright
|
||||
# notice and this paragraph appear in all copies. The copyright
|
||||
# holders make no representation about the suitability of the DTD for
|
||||
# any purpose. It is provided "as is" without expressed or implied
|
||||
# warranty.
|
||||
#
|
||||
# If you modify the DocBook DTD in any way, except for declaring and
|
||||
# referencing additional sets of general entities and declaring
|
||||
# additional notations, label your DTD as a variant of DocBook. See
|
||||
# the maintenance documentation for more information.
|
||||
#
|
||||
# Please direct all questions, bug reports, or suggestions for
|
||||
# changes to the docbook@lists.oasis-open.org mailing list. For more
|
||||
# information, see http://www.oasis-open.org/docbook/.
|
||||
|
||||
# ......................................................................
|
||||
|
||||
# This is the driver file for V4.5 of the DocBook DTD.
|
||||
# Please use the following formal public identifier to identify it:
|
||||
#
|
||||
# "-//OASIS//DTD DocBook XML V4.5//EN"
|
||||
#
|
||||
# For example, if your document's top-level element is Book, and
|
||||
# you are using DocBook directly, use the FPI in the DOCTYPE
|
||||
# declaration:
|
||||
#
|
||||
# <!DOCTYPE book PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN"
|
||||
# "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd"
|
||||
# [...]>
|
||||
#
|
||||
# Or, if you have a higher-level driver file that customizes DocBook,
|
||||
# use the FPI in the parameter entity declaration:
|
||||
#
|
||||
# <!ENTITY % DocBookDTD PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN"
|
||||
# "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd">
|
||||
# %DocBookDTD;
|
||||
#
|
||||
# See the documentation for detailed information on the parameter
|
||||
# entity and module scheme used in DocBook, customizing DocBook and
|
||||
# planning for interchange, and changes made since the last release
|
||||
# of DocBook.
|
||||
|
||||
# ......................................................................
|
||||
|
||||
# Enable SGML features .................................................
|
||||
|
||||
# ......................................................................
|
||||
|
||||
# Notation declarations ................................................
|
||||
|
||||
include "dbnotnx.rnc"
|
||||
# ......................................................................
|
||||
|
||||
# ISO character entity sets ............................................
|
||||
|
||||
# euro sign, U+20AC NEW
|
||||
|
||||
# ......................................................................
|
||||
|
||||
# DTD modules ..........................................................
|
||||
|
||||
# Information pool ..............
|
||||
include "dbpoolx.rnc"
|
||||
# Redeclaration placeholder .....
|
||||
|
||||
# Document hierarchy ............
|
||||
include "dbhierx.rnc"
|
||||
start =
|
||||
articleinfo
|
||||
| honorific
|
||||
| legalnotice
|
||||
| procedure
|
||||
| simplelist
|
||||
| keycode
|
||||
| refsynopsisdiv
|
||||
| article
|
||||
| phrase
|
||||
| destructorsynopsis
|
||||
| itemizedlist
|
||||
| audioobject
|
||||
| link
|
||||
| sect1info
|
||||
| xref
|
||||
| glossaryinfo
|
||||
| varname
|
||||
| keywordset
|
||||
| informalequation
|
||||
| toc
|
||||
| pagenums
|
||||
| lot
|
||||
| shortcut
|
||||
| glosslist
|
||||
| option
|
||||
| bibliosource
|
||||
| variablelist
|
||||
| filename
|
||||
| pob
|
||||
| colgroup
|
||||
| foreignphrase
|
||||
| group
|
||||
| substeps
|
||||
| conftitle
|
||||
| textobject
|
||||
| menuchoice
|
||||
| colspec
|
||||
| contractsponsor
|
||||
| tocback
|
||||
| contractnum
|
||||
| constant
|
||||
| dedication
|
||||
| inlineequation
|
||||
| bibliographyinfo
|
||||
| country
|
||||
| glossseealso
|
||||
| bridgehead
|
||||
| mousebutton
|
||||
| surname
|
||||
| stepalternatives
|
||||
| tertiaryie
|
||||
| mediaobject
|
||||
| msgentry
|
||||
| fax
|
||||
| initializer
|
||||
| table
|
||||
| task
|
||||
| setinfo
|
||||
| videodata
|
||||
| bibliodiv
|
||||
| issuenum
|
||||
| phone
|
||||
| state
|
||||
| refsynopsisdivinfo
|
||||
| member
|
||||
| glossentry
|
||||
| term
|
||||
| msgtext
|
||||
| tr
|
||||
| errortype
|
||||
| confdates
|
||||
| inlinegraphic
|
||||
| th
|
||||
| segmentedlist
|
||||
| remark
|
||||
| preface
|
||||
| structname
|
||||
| publisher
|
||||
| td
|
||||
| oointerface
|
||||
| refsection
|
||||
| type
|
||||
| taskrelated
|
||||
| msgrel
|
||||
| artpagenums
|
||||
| bibliomixed
|
||||
| revnumber
|
||||
| firstterm
|
||||
| seeie
|
||||
| spanspec
|
||||
| toclevel5
|
||||
| trademark
|
||||
| toclevel4
|
||||
| toclevel3
|
||||
| toclevel2
|
||||
| indexentry
|
||||
| toclevel1
|
||||
| colophon
|
||||
| methodparam
|
||||
| sidebarinfo
|
||||
| productnumber
|
||||
| funcprototype
|
||||
| inlinemediaobject
|
||||
| refclass
|
||||
| lotentry
|
||||
| paramdef
|
||||
| classsynopsisinfo
|
||||
| qandaset
|
||||
| footnote
|
||||
| msglevel
|
||||
| keysym
|
||||
| citation
|
||||
| simplemsgentry
|
||||
| othercredit
|
||||
| subjectset
|
||||
| keycap
|
||||
| orderedlist
|
||||
| refmiscinfo
|
||||
| blockinfo
|
||||
| programlistingco
|
||||
| abbrev
|
||||
| sidebar
|
||||
| informalfigure
|
||||
| tip
|
||||
| primaryie
|
||||
| appendixinfo
|
||||
| partintro
|
||||
| glossdiv
|
||||
| confgroup
|
||||
| segtitle
|
||||
| taskprerequisites
|
||||
| street
|
||||
| tbody
|
||||
| caption
|
||||
| markup
|
||||
| setindex
|
||||
| msgsub
|
||||
| subscript
|
||||
| orgname
|
||||
| fieldsynopsis
|
||||
| refname
|
||||
| void
|
||||
| sect5
|
||||
| sect4
|
||||
| sect3
|
||||
| chapter
|
||||
| sect2
|
||||
| sect1
|
||||
| modifier
|
||||
| col
|
||||
| orgdiv
|
||||
| city
|
||||
| bibliolist
|
||||
| funcparams
|
||||
| application
|
||||
| \token
|
||||
| imageobject
|
||||
| literal
|
||||
| funcsynopsis
|
||||
| olink
|
||||
| package
|
||||
| collab
|
||||
| seealsoie
|
||||
| primary
|
||||
| glossterm
|
||||
| termdef
|
||||
| area
|
||||
| ackno
|
||||
| function
|
||||
| collabname
|
||||
| lineannotation
|
||||
| guisubmenu
|
||||
| msgexplan
|
||||
| errorname
|
||||
| property
|
||||
| synopfragmentref
|
||||
| refentryinfo
|
||||
| entry
|
||||
| manvolnum
|
||||
| synopsis
|
||||
| emphasis
|
||||
| appendix
|
||||
| bookinfo
|
||||
| contrib
|
||||
| otheraddr
|
||||
| copyright
|
||||
| methodname
|
||||
| email
|
||||
| ooclass
|
||||
| videoobject
|
||||
| abstract
|
||||
| firstname
|
||||
| revremark
|
||||
| glossdef
|
||||
| guibutton
|
||||
| informalexample
|
||||
| screen
|
||||
| errorcode
|
||||
| command
|
||||
| seriesvolnums
|
||||
| refpurpose
|
||||
| parameter
|
||||
| equation
|
||||
| tfoot
|
||||
| code
|
||||
| jobtitle
|
||||
| sgmltag
|
||||
| screenco
|
||||
| holder
|
||||
| isbn
|
||||
| corpcredit
|
||||
| biblioset
|
||||
| part
|
||||
| symbol
|
||||
| row
|
||||
| bibliomisc
|
||||
| imagedata
|
||||
| secondary
|
||||
| classname
|
||||
| callout
|
||||
| screenshot
|
||||
| bibliomset
|
||||
| indexterm
|
||||
| refsect3
|
||||
| tocchap
|
||||
| para
|
||||
| refsect2
|
||||
| refsect1
|
||||
| date
|
||||
| refdescriptor
|
||||
| wordasword
|
||||
| epigraph
|
||||
| audiodata
|
||||
| hardware
|
||||
| confsponsor
|
||||
| authorgroup
|
||||
| warning
|
||||
| authorinitials
|
||||
| medialabel
|
||||
| varlistentry
|
||||
| authorblurb
|
||||
| itermset
|
||||
| refsect3info
|
||||
| informaltable
|
||||
| guimenuitem
|
||||
| postcode
|
||||
| subjectterm
|
||||
| refnamediv
|
||||
| note
|
||||
| figure
|
||||
| envar
|
||||
| listitem
|
||||
| methodsynopsis
|
||||
| affiliation
|
||||
| funcsynopsisinfo
|
||||
| structfield
|
||||
| blockquote
|
||||
| keyword
|
||||
| chapterinfo
|
||||
| tertiary
|
||||
| year
|
||||
| subtitle
|
||||
| personblurb
|
||||
| refentry
|
||||
| citebiblioid
|
||||
| seglistitem
|
||||
| bibliography
|
||||
| msg
|
||||
| constructorsynopsis
|
||||
| refsect2info
|
||||
| volumenum
|
||||
| database
|
||||
| funcdef
|
||||
| uri
|
||||
| graphicco
|
||||
| biblioid
|
||||
| msgmain
|
||||
| printhistory
|
||||
| glosssee
|
||||
| beginpage
|
||||
| glossary
|
||||
| set
|
||||
| highlights
|
||||
| objectinfo
|
||||
| tocpart
|
||||
| guiicon
|
||||
| revhistory
|
||||
| seg
|
||||
| see
|
||||
| msgorig
|
||||
| areaspec
|
||||
| partinfo
|
||||
| index
|
||||
| sectioninfo
|
||||
| refsectioninfo
|
||||
| optional
|
||||
| confnum
|
||||
| replaceable
|
||||
| refsect1info
|
||||
| corpauthor
|
||||
| step
|
||||
| anchor
|
||||
| arg
|
||||
| mathphrase
|
||||
| setindexinfo
|
||||
| keycombo
|
||||
| address
|
||||
| cmdsynopsis
|
||||
| computeroutput
|
||||
| literallayout
|
||||
| qandaentry
|
||||
| sect5info
|
||||
| bibliocoverage
|
||||
| coref
|
||||
| editor
|
||||
| superscript
|
||||
| personname
|
||||
| pubsnumber
|
||||
| graphic
|
||||
| simplesect
|
||||
| accel
|
||||
| secondaryie
|
||||
| biblioref
|
||||
| publishername
|
||||
| bibliorelation
|
||||
| prefaceinfo
|
||||
| revision
|
||||
| screeninfo
|
||||
| sbr
|
||||
| example
|
||||
| citetitle
|
||||
| issn
|
||||
| invpartnumber
|
||||
| indexdiv
|
||||
| sect4info
|
||||
| corpname
|
||||
| lineage
|
||||
| ooexception
|
||||
| reference
|
||||
| revdescription
|
||||
| title
|
||||
| edition
|
||||
| co
|
||||
| msgaud
|
||||
| guimenu
|
||||
| shortaffil
|
||||
| titleabbrev
|
||||
| msginfo
|
||||
| refmeta
|
||||
| qandadiv
|
||||
| mediaobjectco
|
||||
| seealso
|
||||
| exceptionname
|
||||
| answer
|
||||
| programlisting
|
||||
| tgroup
|
||||
| refentrytitle
|
||||
| book
|
||||
| errortext
|
||||
| varargs
|
||||
| sect3info
|
||||
| citerefentry
|
||||
| tasksummary
|
||||
| quote
|
||||
| othername
|
||||
| prompt
|
||||
| entrytbl
|
||||
| interfacename
|
||||
| acronym
|
||||
| modespec
|
||||
| msgset
|
||||
| thead
|
||||
| textdata
|
||||
| userinput
|
||||
| attribution
|
||||
| footnoteref
|
||||
| action
|
||||
| tocentry
|
||||
| tocfront
|
||||
| author
|
||||
| imageobjectco
|
||||
| alt
|
||||
| question
|
||||
| ulink
|
||||
| subject
|
||||
| pubdate
|
||||
| returnvalue
|
||||
| label
|
||||
| caution
|
||||
| section
|
||||
| systemitem
|
||||
| referenceinfo
|
||||
| sect2info
|
||||
| calloutlist
|
||||
| classsynopsis
|
||||
| productname
|
||||
| simpara
|
||||
| synopfragment
|
||||
| important
|
||||
| interface
|
||||
| releaseinfo
|
||||
| formalpara
|
||||
| areaset
|
||||
| biblioentry
|
||||
| indexinfo
|
||||
| guilabel
|
||||
# ......................................................................
|
||||
|
||||
# Other general entities ...............................................
|
||||
|
||||
# End of DocBook XML DTD V4.5 ..........................................
|
||||
|
||||
# ......................................................................
|
|
@ -1,225 +0,0 @@
|
|||
# ......................................................................
|
||||
|
||||
# DocBook XML HTML Table Module V4.5 ...................................
|
||||
|
||||
# File htmltblx.mod ....................................................
|
||||
|
||||
# Copyright 2003-2006 ArborText, Inc., Norman Walsh, Sun Microsystems,
|
||||
# Inc., and the Organization for the Advancement of Structured Information
|
||||
# Standards (OASIS).
|
||||
#
|
||||
# $Id: htmltblx.mod 6340 2006-10-03 13:23:24Z nwalsh $
|
||||
#
|
||||
# Permission to use, copy, modify and distribute the DocBook XML DTD
|
||||
# and its accompanying documentation for any purpose and without fee
|
||||
# is hereby granted in perpetuity, provided that the above copyright
|
||||
# notice and this paragraph appear in all copies. The copyright
|
||||
# holders make no representation about the suitability of the DTD for
|
||||
# any purpose. It is provided "as is" without expressed or implied
|
||||
# warranty.
|
||||
#
|
||||
# If you modify the DocBook XML DTD in any way, except for declaring and
|
||||
# referencing additional sets of general entities and declaring
|
||||
# additional notations, label your DTD as a variant of DocBook. See
|
||||
# the maintenance documentation for more information.
|
||||
#
|
||||
# Please direct all questions, bug reports, or suggestions for
|
||||
# changes to the docbook@lists.oasis-open.org mailing list. For more
|
||||
# information, see http://www.oasis-open.org/docbook/.
|
||||
|
||||
# ......................................................................
|
||||
|
||||
# This module contains the definitions for elements that are
|
||||
# isomorphic to the HTML elements. One could argue we should
|
||||
# instead have based ourselves on the XHTML Table Module, but the
|
||||
# HTML one is more like what browsers are likely to accept today
|
||||
# and users are likely to use.
|
||||
#
|
||||
# This module has been developed for use with the DocBook V4.5
|
||||
# "union table model" in which elements and attlists common to both
|
||||
# models are defined (as the union) in the CALS table module by
|
||||
# setting various parameter entities appropriately in this file.
|
||||
#
|
||||
# In DTD driver files referring to this module, please use an entity
|
||||
# declaration that uses the public identifier shown below:
|
||||
#
|
||||
# <!ENTITY % htmltbl PUBLIC
|
||||
# "-//OASIS//ELEMENTS DocBook XML HTML Tables V4.5//EN"
|
||||
# "htmltblx.mod">
|
||||
# %htmltbl;
|
||||
#
|
||||
# See the documentation for detailed information on the parameter
|
||||
# entity and module scheme used in DocBook, customizing DocBook and
|
||||
# planning for interchange, and changes made since the last release
|
||||
# of DocBook.
|
||||
|
||||
# ======================= XHTML Tables =======================================
|
||||
|
||||
namespace a = "http://relaxng.org/ns/compatibility/annotations/1.0"
|
||||
|
||||
html.coreattrs =
|
||||
common.attrib,
|
||||
attribute class { text }?,
|
||||
attribute style { text }?,
|
||||
attribute title { text }?
|
||||
# Does not contain lang or dir because they are in %common.attribs
|
||||
i18n = attribute xml:lang { xsd:NMTOKEN }?
|
||||
events =
|
||||
attribute onclick { text }?,
|
||||
attribute ondblclick { text }?,
|
||||
attribute onmousedown { text }?,
|
||||
attribute onmouseup { text }?,
|
||||
attribute onmouseover { text }?,
|
||||
attribute onmousemove { text }?,
|
||||
attribute onmouseout { text }?,
|
||||
attribute onkeypress { text }?,
|
||||
attribute onkeydown { text }?,
|
||||
attribute onkeyup { text }?
|
||||
attrs = html.coreattrs, i18n, events
|
||||
cellhalign =
|
||||
attribute align { "left" | "center" | "right" | "justify" | "char" }?,
|
||||
attribute char { text }?,
|
||||
attribute charoff { text }?
|
||||
cellvalign =
|
||||
attribute valign { "top" | "middle" | "bottom" | "baseline" }?
|
||||
# doc:A group of columns in an HTML table.
|
||||
colgroup = element colgroup { colgroup.attlist, col* }
|
||||
# doc:Specifications for a column in an HTML table.
|
||||
col = element col { col.attlist, empty }
|
||||
# doc:A row in an HTML table.
|
||||
tr = element tr { tr.attlist, (th | td)+ }
|
||||
# doc:A table header entry in an HTML table.
|
||||
th =
|
||||
element th {
|
||||
th.attlist, (para.char.mix | tabentry.mix | table | informaltable)*
|
||||
}
|
||||
# doc:A table ntry in an HTML table.
|
||||
td =
|
||||
element td {
|
||||
td.attlist, (para.char.mix | tabentry.mix | table | informaltable)*
|
||||
}
|
||||
colgroup.attlist &=
|
||||
attrs,
|
||||
[ a:defaultValue = "1" ] attribute span { text }?,
|
||||
attribute width { text }?,
|
||||
cellhalign,
|
||||
cellvalign
|
||||
col.attlist &=
|
||||
attrs,
|
||||
[ a:defaultValue = "1" ] attribute span { text }?,
|
||||
attribute width { text }?,
|
||||
cellhalign,
|
||||
cellvalign
|
||||
tr.attlist &=
|
||||
attrs,
|
||||
cellhalign,
|
||||
cellvalign,
|
||||
attribute bgcolor { text }?
|
||||
th.attlist &=
|
||||
attrs,
|
||||
attribute abbr { text }?,
|
||||
attribute axis { text }?,
|
||||
attribute headers { xsd:IDREFS }?,
|
||||
attribute scope { "row" | "col" | "rowgroup" | "colgroup" }?,
|
||||
[ a:defaultValue = "1" ] attribute rowspan { text }?,
|
||||
[ a:defaultValue = "1" ] attribute colspan { text }?,
|
||||
cellhalign,
|
||||
cellvalign,
|
||||
attribute nowrap { "nowrap" }?,
|
||||
attribute bgcolor { text }?,
|
||||
attribute width { text }?,
|
||||
attribute height { text }?
|
||||
td.attlist &=
|
||||
attrs,
|
||||
attribute abbr { text }?,
|
||||
attribute axis { text }?,
|
||||
attribute headers { xsd:IDREFS }?,
|
||||
attribute scope { "row" | "col" | "rowgroup" | "colgroup" }?,
|
||||
[ a:defaultValue = "1" ] attribute rowspan { text }?,
|
||||
[ a:defaultValue = "1" ] attribute colspan { text }?,
|
||||
cellhalign,
|
||||
cellvalign,
|
||||
attribute nowrap { "nowrap" }?,
|
||||
attribute bgcolor { text }?,
|
||||
attribute width { text }?,
|
||||
attribute height { text }?
|
||||
# ======================================================
|
||||
|
||||
# Set up to read in the CALS model configured to
|
||||
# merge with the XHTML table model
|
||||
|
||||
# ======================================================
|
||||
tables.role.attrib = role.attrib
|
||||
# Add label and role attributes to table and informaltable
|
||||
bodyatt =
|
||||
attribute floatstyle { text }?,
|
||||
attribute rowheader { "firstcol" | "norowheader" }?,
|
||||
label.attrib
|
||||
# Add common attributes to Table, TGroup, TBody, THead, TFoot, Row,
|
||||
# EntryTbl, and Entry (and InformalTable element).
|
||||
secur =
|
||||
common.attrib,
|
||||
attribute class { text }?,
|
||||
attribute style { text }?,
|
||||
attribute title { text }?,
|
||||
i18n,
|
||||
events,
|
||||
tables.role.attrib
|
||||
common.table.attribs = bodyatt, secur
|
||||
# Content model for Table (that also allows HTML tables)
|
||||
tbl.table.mdl =
|
||||
(blockinfo?,
|
||||
formalobject.title.content,
|
||||
ndxterm.class*,
|
||||
textobject*,
|
||||
(graphic+ | mediaobject+ | tgroup+))
|
||||
| (caption, (col* | colgroup*), thead?, tfoot?, (tbody+ | tr+))
|
||||
informal.tbl.table.mdl =
|
||||
(textobject*, (graphic+ | mediaobject+ | tgroup+))
|
||||
| ((col* | colgroup*), thead?, tfoot?, (tbody+ | tr+))
|
||||
# Attributes for Table (including HTML ones)
|
||||
|
||||
# N.B. rules = (none | groups | rows | cols | all) but it can't be spec'd
|
||||
|
||||
# that way because 'all' already occurs in a different enumeration in
|
||||
|
||||
# CALS tables (frame).
|
||||
tbl.table.att =
|
||||
attribute tabstyle { text }?,
|
||||
attribute tocentry { yesorno.attvals }?,
|
||||
attribute shortentry { yesorno.attvals }?,
|
||||
attribute orient { "port" | "land" }?,
|
||||
attribute pgwide { yesorno.attvals }?,
|
||||
attribute summary { text }?,
|
||||
attribute width { text }?,
|
||||
attribute border { text }?,
|
||||
attribute rules { text }?,
|
||||
attribute cellspacing { text }?,
|
||||
attribute cellpadding { text }?,
|
||||
attribute align { "left" | "center" | "right" }?,
|
||||
attribute bgcolor { text }?
|
||||
tbl.frame.attval =
|
||||
"void"
|
||||
| "above"
|
||||
| "below"
|
||||
| "hsides"
|
||||
| "lhs"
|
||||
| "rhs"
|
||||
| "vsides"
|
||||
| "box"
|
||||
| "border"
|
||||
| "top"
|
||||
| "bottom"
|
||||
| "topbot"
|
||||
| "all"
|
||||
| "sides"
|
||||
| "none"
|
||||
# Allow either objects or inlines; beware of REs between elements.
|
||||
tbl.entry.mdl = para.char.mix | tabentry.mix
|
||||
# thead, tfoot, and tbody are defined in both table models,
|
||||
# so we set up parameter entities to define union models for them
|
||||
tbl.hdft.mdl = tr+ | (colspec*, row+)
|
||||
tbl.tbody.mdl = tr+ | row+
|
||||
# End of DocBook XML HTML Table Module V4.5 ............................
|
||||
|
||||
# ......................................................................
|
|
@ -1,35 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE authorgroup PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
<!ENTITY % BOOK_ENTITIES SYSTEM "Defensive_Coding.ent">
|
||||
%BOOK_ENTITIES;
|
||||
]>
|
||||
<authorgroup>
|
||||
<author>
|
||||
<firstname>Florian</firstname>
|
||||
<surname>Weimer</surname>
|
||||
<affiliation>
|
||||
<orgname>Red Hat</orgname>
|
||||
<orgdiv>Product Security Team</orgdiv>
|
||||
</affiliation>
|
||||
<email>fweimer@redhat.com</email>
|
||||
</author>
|
||||
<author>
|
||||
<firstname>Nikos</firstname>
|
||||
<surname>Mavrogiannopoulos</surname>
|
||||
<affiliation>
|
||||
<orgname>Red Hat</orgname>
|
||||
<orgdiv>Crypto Team</orgdiv>
|
||||
</affiliation>
|
||||
<email>nmav@redhat.com</email>
|
||||
</author>
|
||||
<author>
|
||||
<firstname>Robert</firstname>
|
||||
<surname>Relyea</surname>
|
||||
<affiliation>
|
||||
<orgname>Red Hat</orgname>
|
||||
<orgdiv>Crypto Team</orgdiv>
|
||||
</affiliation>
|
||||
<email>rrelyea@redhat.com</email>
|
||||
</author>
|
||||
</authorgroup>
|
||||
|
|
@ -1,29 +0,0 @@
|
|||
<?xml version='1.0' encoding='UTF-8' ?>
|
||||
<!DOCTYPE bookinfo PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<bookinfo id="book-Defensive_Coding">
|
||||
<title>Defensive Coding</title>
|
||||
<subtitle>A Guide to Improving Software Security</subtitle>
|
||||
<edition>1</edition>
|
||||
<pubsnumber>1</pubsnumber>
|
||||
<productname>Unofficial fork</productname>
|
||||
<productnumber></productnumber>
|
||||
<abstract>
|
||||
<para>
|
||||
This document provides guidelines for improving software
|
||||
security through secure coding. It covers common
|
||||
programming languages and libraries, and focuses on
|
||||
concrete recommendations.
|
||||
</para>
|
||||
</abstract>
|
||||
<corpauthor>
|
||||
<inlinemediaobject>
|
||||
<imageobject>
|
||||
<imagedata fileref="Common_Content/images/title_logo.svg" format="SVG" />
|
||||
</imageobject>
|
||||
</inlinemediaobject>
|
||||
</corpauthor>
|
||||
<xi:include href="Common_Content/Legal_Notice.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="Author_Group.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</bookinfo>
|
||||
|
|
@ -1,209 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE section PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<section id="sect-Defensive_Coding-C-Allocators">
|
||||
<title>Memory Allocators</title>
|
||||
|
||||
<section>
|
||||
<title><function>malloc</function> and Related Functions</title>
|
||||
<para>
|
||||
The C library interfaces for memory allocation are provided by
|
||||
<function>malloc</function>, <function>free</function> and
|
||||
<function>realloc</function>, and the
|
||||
<function>calloc</function> function. In addition to these
|
||||
generic functions, there are derived functions such as
|
||||
<function>strdup</function> which perform allocation using
|
||||
<function>malloc</function> internally, but do not return
|
||||
untyped heap memory (which could be used for any object).
|
||||
</para>
|
||||
<para>
|
||||
The C compiler knows about these functions and can use their
|
||||
expected behavior for optimizations. For instance, the compiler
|
||||
assumes that an existing pointer (or a pointer derived from an
|
||||
existing pointer by arithmetic) will not point into the memory
|
||||
area returned by <function>malloc</function>.
|
||||
</para>
|
||||
<para>
|
||||
If the allocation fails, <function>realloc</function> does not
|
||||
free the old pointer. Therefore, the idiom <literal>ptr =
|
||||
realloc(ptr, size);</literal> is wrong because the memory
|
||||
pointed to by <literal>ptr</literal> leaks in case of an error.
|
||||
</para>
|
||||
<section id="sect-Defensive_Coding-C-Use-After-Free">
|
||||
<title>Use-after-free errors</title>
|
||||
<para>
|
||||
After <function>free</function>, the pointer is invalid.
|
||||
Further pointer dereferences are not allowed (and are usually
|
||||
detected by <application>valgrind</application>). Less obvious
|
||||
is that any <emphasis>use</emphasis> of the old pointer value is
|
||||
not allowed, either. In particular, comparisons with any other
|
||||
pointer (or the null pointer) are undefined according to the C
|
||||
standard.
|
||||
</para>
|
||||
<para>
|
||||
The same rules apply to <function>realloc</function> if the
|
||||
memory area cannot be enlarged in-place. For instance, the
|
||||
compiler may assume that a comparison between the old and new
|
||||
pointer will always return false, so it is impossible to detect
|
||||
movement this way.
|
||||
</para>
|
||||
</section>
|
||||
<section>
|
||||
<title>Handling Memory Allocation Errors</title>
|
||||
<para>
|
||||
Recovering from out-of-memory errors is often difficult or even
|
||||
impossible. In these cases, <function>malloc</function> and
|
||||
other allocation functions return a null pointer. Dereferencing
|
||||
this pointer lead to a crash. Such dereferences can even be
|
||||
exploitable for code execution if the dereference is combined
|
||||
with an array subscript.
|
||||
</para>
|
||||
<para>
|
||||
In general, if you cannot check all allocation calls and
|
||||
handle failure, you should abort the program on allocation
|
||||
failure, and not rely on the null pointer dereference to
|
||||
terminate the process. See
|
||||
<xref
|
||||
linkend="sect-Defensive_Coding-Tasks-Serialization-Decoders"/>
|
||||
for related memory allocation concerns.
|
||||
</para>
|
||||
</section>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-C-Allocators-alloca">
|
||||
<title><function>alloca</function> and Other Forms of Stack-based
|
||||
Allocation</title>
|
||||
<para>
|
||||
Allocation on the stack is risky because stack overflow checking
|
||||
is implicit. There is a guard page at the end of the memory
|
||||
area reserved for the stack. If the program attempts to read
|
||||
from or write to this guard page, a <literal>SIGSEGV</literal>
|
||||
signal is generated and the program typically terminates.
|
||||
</para>
|
||||
<para>
|
||||
This is sufficient for detecting typical stack overflow
|
||||
situations such as unbounded recursion, but it fails when the
|
||||
stack grows in increments larger than the size of the guard
|
||||
page. In this case, it is possible that the stack pointer ends
|
||||
up pointing into a memory area which has been allocated for a
|
||||
different purposes. Such misbehavior can be exploitable.
|
||||
</para>
|
||||
<para>
|
||||
A common source for large stack growth are calls to
|
||||
<function>alloca</function> and related functions such as
|
||||
<function>strdupa</function>. These functions should be avoided
|
||||
because of the lack of error checking. (They can be used safely
|
||||
if the allocated size is less than the page size (typically,
|
||||
4096 bytes), but this case is relatively rare.) Additionally,
|
||||
relying on <function>alloca</function> makes it more difficult
|
||||
to reorganize the code because it is not allowed to use the
|
||||
pointer after the function calling <function>alloca</function>
|
||||
has returned, even if this function has been inlined into its
|
||||
caller.
|
||||
</para>
|
||||
<para>
|
||||
Similar concerns apply to <emphasis>variable-length
|
||||
arrays</emphasis> (VLAs), a feature of the C99 standard which
|
||||
started as a GNU extension. For large objects exceeding the
|
||||
page size, there is no error checking, either.
|
||||
</para>
|
||||
<para>
|
||||
In both cases, negative or very large sizes can trigger a
|
||||
stack-pointer wraparound, and the stack pointer and end up
|
||||
pointing into caller stack frames, which is fatal and can be
|
||||
exploitable.
|
||||
</para>
|
||||
<para>
|
||||
If you want to use <function>alloca</function> or VLAs for
|
||||
performance reasons, consider using a small on-stack array (less
|
||||
than the page size, large enough to fulfill most requests). If
|
||||
the requested size is small enough, use the on-stack array.
|
||||
Otherwise, call <function>malloc</function>. When exiting the
|
||||
function, check if <function>malloc</function> had been called,
|
||||
and free the buffer as needed.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-C-Allocators-Arrays">
|
||||
<title>Array Allocation</title>
|
||||
<para>
|
||||
When allocating arrays, it is important to check for overflows.
|
||||
The <function>calloc</function> function performs such checks.
|
||||
</para>
|
||||
<para>
|
||||
If <function>malloc</function> or <function>realloc</function>
|
||||
is used, the size check must be written manually. For instance,
|
||||
to allocate an array of <literal>n</literal> elements of type
|
||||
<literal>T</literal>, check that the requested size is not
|
||||
greater than <literal>((size_t) -1) / sizeof(T)</literal>. See
|
||||
<xref linkend="sect-Defensive_Coding-C-Arithmetic"/>.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-C-Allocators-Custom">
|
||||
<title>Custom Memory Allocators</title>
|
||||
<para>
|
||||
Custom memory allocates come in two forms: replacements for
|
||||
<function>malloc</function>, and completely different interfaces
|
||||
for memory management. Both approaches can reduce the
|
||||
effectiveness of <application>valgrind</application> and similar
|
||||
tools, and the heap corruption detection provided by GNU libc, so
|
||||
they should be avoided.
|
||||
</para>
|
||||
<para>
|
||||
Memory allocators are difficult to write and contain many
|
||||
performance and security pitfalls.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
When computing array sizes or rounding up allocation
|
||||
requests (to the next allocation granularity, or for
|
||||
alignment purposes), checks for arithmetic overflow are
|
||||
required.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Size computations for array allocations need overflow
|
||||
checking. See <xref
|
||||
linkend="sect-Defensive_Coding-C-Allocators-Arrays"/>.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
It can be difficult to beat well-tuned general-purpose
|
||||
allocators. In micro benchmarks, pool allocators can show
|
||||
huge wins, and size-specific pools can reduce internal
|
||||
fragmentation. But often, utilization of individual pools
|
||||
is poor, and external fragmentation increases the overall
|
||||
memory usage.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
</section>
|
||||
|
||||
<section>
|
||||
<title>Conservative Garbage Collection</title>
|
||||
<para>
|
||||
Garbage collection can be an alternative to explicit memory
|
||||
management using <function>malloc</function> and
|
||||
<function>free</function>. The Boehm-Dehmers-Weiser allocator
|
||||
can be used from C programs, with minimal type annotations.
|
||||
Performance is competitive with <function>malloc</function> on
|
||||
64-bit architectures, especially for multi-threaded programs.
|
||||
The stop-the-world pauses may be problematic for some real-time
|
||||
applications, though.
|
||||
</para>
|
||||
<para>
|
||||
However, using a conservative garbage collector may reduce
|
||||
opportunities for code reduce because once one library in a
|
||||
program uses garbage collection, the whole process memory needs
|
||||
to be subject to it, so that no pointers are missed. The
|
||||
Boehm-Dehmers-Weiser collector also reserves certain signals for
|
||||
internal use, so it is not fully transparent to the rest of the
|
||||
program.
|
||||
</para>
|
||||
</section>
|
||||
</section>
|
||||
|
|
@ -1,221 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE section PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<section id="sect-Defensive_Coding-C-Language">
|
||||
<title>The Core Language</title>
|
||||
<para>
|
||||
C provides no memory safety. Most recommendations in this section
|
||||
deal with this aspect of the language.
|
||||
</para>
|
||||
|
||||
<section id="sect-Defensive_Coding-C-Undefined">
|
||||
<title>Undefined Behavior</title>
|
||||
<para>
|
||||
Some C constructs are defined to be undefined by the C standard.
|
||||
This does not only mean that the standard does not describe
|
||||
what happens when the construct is executed. It also allows
|
||||
optimizing compilers such as GCC to assume that this particular
|
||||
construct is never reached. In some cases, this has caused
|
||||
GCC to optimize security checks away. (This is not a flaw in GCC
|
||||
or the C language. But C certainly has some areas which are more
|
||||
difficult to use than others.)
|
||||
</para>
|
||||
|
||||
<para>
|
||||
Common sources of undefined behavior are:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem><para>out-of-bounds array accesses</para></listitem>
|
||||
<listitem><para>null pointer dereferences</para></listitem>
|
||||
<listitem><para>overflow in signed integer arithmetic</para></listitem>
|
||||
</itemizedlist>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-C-Pointers">
|
||||
<title>Recommendations for Pointers and Array Handling</title>
|
||||
<para>
|
||||
Always keep track of the size of the array you are working with.
|
||||
Often, code is more obviously correct when you keep a pointer
|
||||
past the last element of the array, and calculate the number of
|
||||
remaining elements by substracting the current position from
|
||||
that pointer. The alternative, updating a separate variable
|
||||
every time when the position is advanced, is usually less
|
||||
obviously correct.
|
||||
</para>
|
||||
<para>
|
||||
<xref linkend="ex-Defensive_Coding-C-Pointers-remaining"/>
|
||||
shows how to extract Pascal-style strings from a character
|
||||
buffer. The two pointers kept for length checks are
|
||||
<varname>inend</varname> and <varname>outend</varname>.
|
||||
<varname>inp</varname> and <varname>outp</varname> are the
|
||||
respective positions.
|
||||
The number of input bytes is checked using the expression
|
||||
<literal>len > (size_t)(inend - inp)</literal>.
|
||||
The cast silences a compiler warning;
|
||||
<varname>inend</varname> is always larger than
|
||||
<varname>inp</varname>.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-C-Pointers-remaining">
|
||||
<title>Array processing in C</title>
|
||||
<xi:include href="snippets/C-Pointers-remaining.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
It is important that the length checks always have the form
|
||||
<literal>len > (size_t)(inend - inp)</literal>, where
|
||||
<varname>len</varname> is a variable of type
|
||||
<type>size_t</type> which denotes the <emphasis>total</emphasis>
|
||||
number of bytes which are about to be read or written next. In
|
||||
general, it is not safe to fold multiple such checks into one,
|
||||
as in <literal>len1 + len2 > (size_t)(inend - inp)</literal>,
|
||||
because the expression on the left can overflow or wrap around
|
||||
(see <xref linkend="sect-Defensive_Coding-C-Arithmetic"/>), and it
|
||||
no longer reflects the number of bytes to be processed.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-C-Arithmetic">
|
||||
<title>Recommendations for Integer Arithmetic</title>
|
||||
<para>
|
||||
Overflow in signed integer arithmetic is undefined. This means
|
||||
that it is not possible to check for overflow after it happened,
|
||||
see <xref linkend="ex-Defensive_Coding-C-Arithmetic-bad"/>.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-C-Arithmetic-bad">
|
||||
<title>Incorrect overflow detection in C</title>
|
||||
<xi:include href="snippets/C-Arithmetic-add.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
The following approaches can be used to check for overflow,
|
||||
without actually causing it.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
Use a wider type to perform the calculation, check that the
|
||||
result is within bounds, and convert the result to the
|
||||
original type. All intermediate results must be checked in
|
||||
this way.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Perform the calculation in the corresponding unsigned type
|
||||
and use bit fiddling to detect the overflow.
|
||||
<xref linkend="ex-Defensive_Coding-C-Arithmetic-add_unsigned"/>
|
||||
shows how to perform an overflow check for unsigned integer
|
||||
addition. For three or more terms, all the intermediate
|
||||
additions have to be checked in this way.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<example id="ex-Defensive_Coding-C-Arithmetic-add_unsigned">
|
||||
<title>Overflow checking for unsigned addition</title>
|
||||
<xi:include href="snippets/C-Arithmetic-add_unsigned.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
Compute bounds for acceptable input values which are known
|
||||
to avoid overflow, and reject other values. This is the
|
||||
preferred way for overflow checking on multiplications,
|
||||
see <xref linkend="ex-Defensive_Coding-C-Arithmetic-mult"/>.
|
||||
<!-- This approach can result in bogus compiler warnings
|
||||
with signed types:
|
||||
http://gcc.gnu.org/bugzilla/post_bug.cgi -->
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<example id="ex-Defensive_Coding-C-Arithmetic-mult">
|
||||
<title>Overflow checking for unsigned multiplication</title>
|
||||
<xi:include href="snippets/C-Arithmetic-mult.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
Basic arithmetic operations are commutative, so for bounds checks,
|
||||
there are two different but mathematically equivalent
|
||||
expressions. Sometimes, one of the expressions results in
|
||||
better code because parts of it can be reduced to a constant.
|
||||
This applies to overflow checks for multiplication <literal>a *
|
||||
b</literal> involving a constant <literal>a</literal>, where the
|
||||
expression is reduced to <literal>b > C</literal> for some
|
||||
constant <literal>C</literal> determined at compile time. The
|
||||
other expression, <literal>b && a > ((unsigned)-1) /
|
||||
b</literal>, is more difficult to optimize at compile time.
|
||||
</para>
|
||||
<para>
|
||||
When a value is converted to a signed integer, GCC always
|
||||
chooses the result based on 2's complement arithmetic. This GCC
|
||||
extension (which is also implemented by other compilers) helps a
|
||||
lot when implementing overflow checks.
|
||||
</para>
|
||||
<para>
|
||||
Sometimes, it is necessary to compare unsigned and signed
|
||||
integer variables. This results in a compiler warning,
|
||||
<emphasis>comparison between signed and unsigned integer
|
||||
expressions</emphasis>, because the comparison often gives
|
||||
unexpected results for negative values. When adding a cast,
|
||||
make sure that negative values are covered properly. If the
|
||||
bound is unsigned and the checked quantity is signed, you should
|
||||
cast the checked quantity to an unsigned type as least as wide
|
||||
as either operand type. As a result, negative values will fail
|
||||
the bounds check. (You can still check for negative values
|
||||
separately for clarity, and the compiler will optimize away this
|
||||
redundant check.)
|
||||
</para>
|
||||
<para>
|
||||
Legacy code should be compiled with the <option>-fwrapv</option>
|
||||
GCC option. As a result, GCC will provide 2's complement
|
||||
semantics for integer arithmetic, including defined behavior on
|
||||
integer overflow.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-C-Globals">
|
||||
<title>Global Variables</title>
|
||||
<para>
|
||||
Global variables should be avoided because they usually lead to
|
||||
thread safety hazards. In any case, they should be declared
|
||||
<literal>static</literal>, so that access is restricted to a
|
||||
single translation unit.
|
||||
</para>
|
||||
<para>
|
||||
Global constants are not a problem, but declaring them can be
|
||||
tricky. <xref linkend="ex-Defensive_Coding-C-Globals-String_Array"/>
|
||||
shows how to declare a constant array of constant strings.
|
||||
The second <literal>const</literal> is needed to make the
|
||||
array constant, and not just the strings. It must be placed
|
||||
after the <literal>*</literal>, and not before it.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-C-Globals-String_Array">
|
||||
<title>Declaring a constant array of constant strings</title>
|
||||
<xi:include href="snippets/C-Globals-String_Array.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
Sometimes, static variables local to functions are used as a
|
||||
replacement for proper memory management. Unlike non-static
|
||||
local variables, it is possible to return a pointer to static
|
||||
local variables to the caller. But such variables are
|
||||
well-hidden, but effectively global (just as static variables at
|
||||
file scope). It is difficult to add thread safety afterwards if
|
||||
such interfaces are used. Merely dropping the
|
||||
<literal>static</literal> keyword in such cases leads to
|
||||
undefined behavior.
|
||||
</para>
|
||||
<para>
|
||||
Another source for static local variables is a desire to reduce
|
||||
stack space usage on embedded platforms, where the stack may
|
||||
span only a few hundred bytes. If this is the only reason why
|
||||
the <literal>static</literal> keyword is used, it can just be
|
||||
dropped, unless the object is very large (larger than
|
||||
128 kilobytes on 32 bit platforms). In the latter case, it is
|
||||
recommended to allocate the object using
|
||||
<literal>malloc</literal>, to obtain proper array checking, for
|
||||
the same reasons outlined in <xref
|
||||
linkend="sect-Defensive_Coding-C-Allocators-alloca"/>.
|
||||
</para>
|
||||
</section>
|
||||
</section>
|
352
en-US/C-Libc.xml
352
en-US/C-Libc.xml
|
@ -1,352 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE section PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<section id="sect-Defensive_Coding-C-Libc">
|
||||
<title>The C Standard Library</title>
|
||||
<para>
|
||||
Parts of the C standard library (and the UNIX and GNU extensions)
|
||||
are difficult to use, so you should avoid them.
|
||||
</para>
|
||||
<para>
|
||||
Please check the applicable documentation before using the
|
||||
recommended replacements. Many of these functions allocate
|
||||
buffers using <function>malloc</function> which your code must
|
||||
deallocate explicitly using <function>free</function>.
|
||||
</para>
|
||||
<section id="sect-Defensive_Coding-C-Absolutely-Banned">
|
||||
<title>Absolutely Banned Interfaces</title>
|
||||
<para>
|
||||
The functions listed below must not be used because they are
|
||||
almost always unsafe. Use the indicated replacements instead.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem><para><function>gets</function>
|
||||
⟶ <function>fgets</function></para></listitem>
|
||||
<listitem><para><function>getwd</function>
|
||||
⟶ <function>getcwd</function>
|
||||
or <function>get_current_dir_name</function></para></listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<function>readdir_r</function> ⟶ <function>readdir</function>
|
||||
<!-- It is quite complicated to allocate a properly-sized
|
||||
buffer for use with readdir_r, and readdir provides
|
||||
sufficient thread safety guarantees. -->
|
||||
<!-- ??? Add File_System cross-reference -->
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<function>realpath</function> (with a non-NULL second parameter)
|
||||
⟶ <function>realpath</function> with NULL as the second parameter,
|
||||
or <function>canonicalize_file_name</function>
|
||||
<!-- It is complicated to allocate a properly-sized buffer
|
||||
for use with realpath. -->
|
||||
<!-- ??? Add File_System cross-reference -->
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
The constants listed below must not be used, either. Instead,
|
||||
code must allocate memory dynamically and use interfaces with
|
||||
length checking.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
<literal>NAME_MAX</literal> (limit not actually enforced by
|
||||
the kernel)
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<literal>PATH_MAX</literal> (limit not actually enforced by
|
||||
the kernel)
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<literal>_PC_NAME_MAX</literal> (This limit, returned by the
|
||||
<function>pathconf</function> function, is not enforced by
|
||||
the kernel.)
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<literal>_PC_PATH_MAX</literal> (This limit, returned by the
|
||||
<function>pathconf</function> function, is not enforced by
|
||||
the kernel.)
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
The following structure members must not be used.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
<literal>f_namemax</literal> in <literal>struct
|
||||
statvfs</literal> (limit not actually enforced by the kernel,
|
||||
see <literal>_PC_NAME_MAX</literal> above)
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-C-Avoid">
|
||||
<title>Functions to Avoid</title>
|
||||
<para>
|
||||
The following string manipulation functions can be used securely
|
||||
in principle, but their use should be avoided because they are
|
||||
difficult to use correctly. Calls to these functions can be
|
||||
replaced with <function>asprintf</function> or
|
||||
<function>vasprintf</function>. (For non-GNU targets, these
|
||||
functions are available from Gnulib.) In some cases, the
|
||||
<function>snprintf</function> function might be a suitable
|
||||
replacement, see <xref
|
||||
linkend="sect-Defensive_Coding-C-String-Functions-Length"/>.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem><para><function>sprintf</function></para></listitem>
|
||||
<listitem><para><function>strcat</function></para></listitem>
|
||||
<listitem><para><function>strcpy</function></para></listitem>
|
||||
<listitem><para><function>vsprintf</function></para></listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
Use the indicated replacements for the functions below.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
<function>alloca</function> ⟶
|
||||
<function>malloc</function> and <function>free</function>
|
||||
(see <xref linkend="sect-Defensive_Coding-C-Allocators-alloca"/>)
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<function>putenv</function> ⟶
|
||||
explicit <varname>envp</varname> argument in process creation
|
||||
(see <xref linkend="sect-Defensive_Coding-Tasks-Processes-environ"/>)
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<function>setenv</function> ⟶
|
||||
explicit <varname>envp</varname> argument in process creation
|
||||
(see <xref linkend="sect-Defensive_Coding-Tasks-Processes-environ"/>)
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<function>strdupa</function> ⟶
|
||||
<function>strdup</function> and <function>free</function>
|
||||
(see <xref linkend="sect-Defensive_Coding-C-Allocators-alloca"/>)
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<function>strndupa</function> ⟶
|
||||
<function>strndup</function> and <function>free</function>
|
||||
(see <xref linkend="sect-Defensive_Coding-C-Allocators-alloca"/>)
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<function>system</function> ⟶
|
||||
<function>posix_spawn</function>
|
||||
or <function>fork</function>/<function>execve</function>/
|
||||
(see <xref linkend="sect-Defensive_Coding-Tasks-Processes-execve"/>)
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<function>unsetenv</function> ⟶
|
||||
explicit <varname>envp</varname> argument in process creation
|
||||
(see <xref linkend="sect-Defensive_Coding-Tasks-Processes-environ"/>)
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-C-String-Functions-Length">
|
||||
<title>String Functions with Explicit Length Arguments</title>
|
||||
<para>
|
||||
The C run-time library provides string manipulation functions
|
||||
which not just look for NUL characters for string termination,
|
||||
but also honor explicit lengths provided by the caller.
|
||||
However, these functions evolved over a long period of time, and
|
||||
the lengths mean different things depending on the function.
|
||||
</para>
|
||||
<section id="sect-Defensive_Coding-C-Libc-snprintf">
|
||||
<title><literal>snprintf</literal></title>
|
||||
<para>
|
||||
The <function>snprintf</function> function provides a way to
|
||||
construct a string in a statically-sized buffer. (If the buffer
|
||||
size is allocated on the heap, consider use
|
||||
<function>asprintf</function> instead.)
|
||||
</para>
|
||||
<informalexample>
|
||||
<xi:include href="snippets/C-String-Functions-snprintf.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</informalexample>
|
||||
<para>
|
||||
The second argument to the <function>snprintf</function> call
|
||||
should always be the size of the buffer in the first argument
|
||||
(which should be a character array). Elaborate pointer and
|
||||
length arithmetic can introduce errors and nullify the
|
||||
security benefits of <function>snprintf</function>.
|
||||
</para>
|
||||
<para>
|
||||
In particular, <literal>snprintf</literal> is not well-suited
|
||||
to constructing a string iteratively, by appending to an
|
||||
existing buffer. <function>snprintf</function> returns one of
|
||||
two values, <literal>-1</literal> on errors, or the number of
|
||||
characters which <emphasis>would have been written to the
|
||||
buffer if the buffer were large enough</emphasis>. This means
|
||||
that adding the result of <function>snprintf</function> to the
|
||||
buffer pointer to skip over the characters just written is
|
||||
incorrect and risky. However, as long as the length argument
|
||||
is not zero, the buffer will remain null-terminated. <xref
|
||||
linkend="ex-Defensive_Coding-C-String-Functions-snprintf-incremental"/>
|
||||
works because <literal>end -current > 0</literal> is a loop
|
||||
invariant. After the loop, the result string is in the
|
||||
<varname>buf</varname> variable.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-C-String-Functions-snprintf-incremental">
|
||||
<title>Repeatedly writing to a buffer using <function>snprintf</function></title>
|
||||
<xi:include href="snippets/C-String-Functions-snprintf-incremental.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
If you want to avoid the call to <function>strlen</function>
|
||||
for performance reasons, you have to check for a negative
|
||||
return value from <function>snprintf</function> and also check
|
||||
if the return value is equal to the specified buffer length or
|
||||
larger. Only if neither condition applies, you may advance
|
||||
the pointer to the start of the write buffer by the number
|
||||
return by <function>snprintf</function>. However, this
|
||||
optimization is rarely worthwhile.
|
||||
</para>
|
||||
<para>
|
||||
Note that it is not permitted to use the same buffer both as
|
||||
the destination and as a source argument.
|
||||
</para>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-C-Libc-vsnprintf">
|
||||
<title><literal>vsnprintf</literal> and Format Strings</title>
|
||||
<para>
|
||||
If you use <function>vsnprintf</function> (or
|
||||
<function>vasprintf</function> or even
|
||||
<function>snprintf</function>) with a format string which is
|
||||
not a constant, but a function argument, it is important to
|
||||
annotate the function with a <literal>format</literal>
|
||||
function attribute, so that GCC can warn about misuse of your
|
||||
function (see <xref
|
||||
linkend="ex-Defensive_Coding-C-String-Functions-format-Attribute"/>).
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-C-String-Functions-format-Attribute">
|
||||
<title>The <literal>format</literal> function attribute</title>
|
||||
<xi:include href="snippets/C-String-Functions-format.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-C-Libc-strncpy">
|
||||
<title><function>strncpy</function></title>
|
||||
<para>
|
||||
The <function>strncpy</function> function does not ensure that
|
||||
the target buffer is null-terminated. A common idiom for
|
||||
ensuring NUL termination is:
|
||||
</para>
|
||||
<informalexample>
|
||||
<xi:include href="snippets/C-String-Functions-strncpy.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</informalexample>
|
||||
<para>
|
||||
Another approach uses the <function>strncat</function>
|
||||
function for this purpose:
|
||||
</para>
|
||||
<informalexample>
|
||||
<xi:include href="snippets/C-String-Functions-strncat-as-strncpy.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</informalexample>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-C-Libc-strncat">
|
||||
<title><function>strncat</function></title>
|
||||
<para>
|
||||
The length argument of the <function>strncat</function>
|
||||
function specifies the maximum number of characters copied
|
||||
from the source buffer, excluding the terminating NUL
|
||||
character. This means that the required number of bytes in
|
||||
the destination buffer is the length of the original string,
|
||||
plus the length argument in the <function>strncat</function>
|
||||
call, plus one. Consequently, this function is rarely
|
||||
appropriate for performing a length-checked string operation,
|
||||
with the notable exception of the <function>strcpy</function>
|
||||
emulation described in <xref
|
||||
linkend="sect-Defensive_Coding-C-Libc-strncpy"/>.
|
||||
</para>
|
||||
<para>
|
||||
To implement a length-checked string append, you can use an
|
||||
approach similar to <xref
|
||||
linkend="ex-Defensive_Coding-C-String-Functions-snprintf-incremental"/>:
|
||||
</para>
|
||||
<informalexample>
|
||||
<xi:include href="snippets/C-String-Functions-strncat-emulation.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</informalexample>
|
||||
<para>
|
||||
In many cases, including this one, the string concatenation
|
||||
can be avoided by combining everything into a single format
|
||||
string:
|
||||
</para>
|
||||
<informalexample>
|
||||
<xi:include href="snippets/C-String-Functions-strncat-merged.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</informalexample>
|
||||
<para>
|
||||
But you should must not dynamically construct format strings
|
||||
to avoid concatenation because this would prevent GCC from
|
||||
type-checking the argument lists.
|
||||
</para>
|
||||
<para>
|
||||
It is not possible to use format strings like
|
||||
<literal>"%s%s"</literal> to implement concatenation, unless
|
||||
you use separate buffers. <function>snprintf</function> does
|
||||
not support overlapping source and target strings.
|
||||
</para>
|
||||
</section>
|
||||
<section>
|
||||
<title><function>strlcpy</function> and
|
||||
<function>strlcat</function></title>
|
||||
<para>
|
||||
Some systems support <function>strlcpy</function> and
|
||||
<function>strlcat</function> functions which behave this way,
|
||||
but these functions are not part of GNU libc.
|
||||
<function>strlcpy</function> is often replaced with
|
||||
<function>snprintf</function> with a <literal>"%s"</literal>
|
||||
format string. See <xref
|
||||
linkend="sect-Defensive_Coding-C-Libc-strncpy"/> for a caveat
|
||||
related to the <function>snprintf</function> return value.
|
||||
</para>
|
||||
<para>
|
||||
To emulate <function>strlcat</function>, use the approach
|
||||
described in <xref
|
||||
linkend="sect-Defensive_Coding-C-Libc-strncat"/>.
|
||||
</para>
|
||||
</section>
|
||||
<section>
|
||||
<title>ISO C11 Annex K *<function>_s</function> functions</title>
|
||||
<para>
|
||||
ISO C11 adds another set of length-checking functions, but GNU
|
||||
libc currently does not implement them.
|
||||
</para>
|
||||
</section>
|
||||
<section>
|
||||
<title>Other <function>strn</function>* and
|
||||
<function>stpn</function>* functions</title>
|
||||
<para>
|
||||
GNU libc contains additional functions with different variants
|
||||
of length checking. Consult the documentation before using
|
||||
them to find out what the length actually means.
|
||||
</para>
|
||||
</section>
|
||||
</section>
|
||||
</section>
|
|
@ -1,70 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE section PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<section id="sect-Defensive_Coding-C-Other">
|
||||
<title>Other C-related Topics</title>
|
||||
<section id="sect-Defensive_Coding-C-Wrapper-Functions">
|
||||
<title>Wrapper Functions</title>
|
||||
<para>
|
||||
Some libraries provide wrappers for standard library functions.
|
||||
Common cases include allocation functions such as
|
||||
<function>xmalloc</function> which abort the process on
|
||||
allocation failure (instead of returning a
|
||||
<literal>NULL</literal> pointer), or alternatives to relatively
|
||||
recent library additions such as <function>snprintf</function>
|
||||
(along with implementations for systems which lack them).
|
||||
</para>
|
||||
<para>
|
||||
In general, such wrappers are a bad idea, particularly if they
|
||||
are not implemented as inline functions or preprocessor macros.
|
||||
The compiler lacks knowledge of such wrappers outside the
|
||||
translation unit which defines them, which means that some
|
||||
optimizations and security checks are not performed. Adding
|
||||
<literal>__attribute__</literal> annotations to function
|
||||
declarations can remedy this to some extent, but these
|
||||
annotations have to be maintained carefully for feature parity
|
||||
with the standard implementation.
|
||||
</para>
|
||||
<para>
|
||||
At the minimum, you should apply these attributes:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
If you wrap function which accepts are GCC-recognized format
|
||||
string (for example, a <function>printf</function>-style
|
||||
function used for logging), you should add a suitable
|
||||
<literal>format</literal> attribute, as in <xref
|
||||
linkend="ex-Defensive_Coding-C-String-Functions-format-Attribute"/>.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
If you wrap a function which carries a
|
||||
<literal>warn_unused_result</literal> attribute and you
|
||||
propagate its return value, your wrapper should be declared
|
||||
with <literal>warn_unused_result</literal> as well.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Duplicating the buffer length checks based on the
|
||||
<function>__builtin_object_size</function> GCC builtin is
|
||||
desirable if the wrapper processes arrays. (This
|
||||
functionality is used by the
|
||||
<literal>-D_FORTIFY_SOURCE=2</literal> checks to guard
|
||||
against static buffer overflows.) However, designing
|
||||
appropriate interfaces and implementing the checks may not
|
||||
be entirely straightforward.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
For other attributes (such as <literal>malloc</literal>),
|
||||
careful analysis and comparison with the compiler documentation
|
||||
is required to check if propagating the attribute is
|
||||
appropriate. Incorrectly applied attributes can result in
|
||||
undesired behavioral changes in the compiled code.
|
||||
</para>
|
||||
</section>
|
||||
</section>
|
12
en-US/C.xml
12
en-US/C.xml
|
@ -1,12 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE chapter PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<chapter id="chap-Defensive_Coding-C">
|
||||
<title>The C Programming Language</title>
|
||||
|
||||
<xi:include href="C-Language.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="C-Libc.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="C-Allocators.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="C-Other.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</chapter>
|
||||
|
|
@ -1,188 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE section PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<section id="sect-Defensive_Coding-CXX-Language">
|
||||
<title>The Core Language</title>
|
||||
<para>
|
||||
C++ includes a large subset of the C language. As far as the C
|
||||
subset is used, the recommendations in <xref
|
||||
linkend="chap-Defensive_Coding-C"/> apply.
|
||||
</para>
|
||||
|
||||
<section>
|
||||
<title>Array Allocation with <literal>operator new[]</literal></title>
|
||||
<para>
|
||||
For very large values of <literal>n</literal>, an expression
|
||||
like <literal>new T[n]</literal> can return a pointer to a heap
|
||||
region which is too small. In other words, not all array
|
||||
elements are actually backed with heap memory reserved to the
|
||||
array. Current GCC versions generate code that performs a
|
||||
computation of the form <literal>sizeof(T) * size_t(n) +
|
||||
cookie_size</literal>, where <literal>cookie_size</literal> is
|
||||
currently at most 8. This computation can overflow, and GCC
|
||||
versions prior to 4.8 generated code which did not detect this.
|
||||
(Fedora 18 was the first release which fixed this in GCC.)
|
||||
</para>
|
||||
<para>
|
||||
The <literal>std::vector</literal> template can be used instead
|
||||
an explicit array allocation. (The GCC implementation detects
|
||||
overflow internally.)
|
||||
</para>
|
||||
<para>
|
||||
If there is no alternative to <literal>operator new[]</literal>
|
||||
and the sources will be compiled with older GCC versions, code
|
||||
which allocates arrays with a variable length must check for
|
||||
overflow manually. For the <literal>new T[n]</literal> example,
|
||||
the size check could be <literal>n || (n > 0 && n >
|
||||
(size_t(-1) - 8) / sizeof(T))</literal>. (See <xref
|
||||
linkend="sect-Defensive_Coding-C-Arithmetic"/>.) If there are
|
||||
additional dimensions (which must be constants according to the
|
||||
C++ standard), these should be included as factors in the
|
||||
divisor.
|
||||
</para>
|
||||
<para>
|
||||
These countermeasures prevent out-of-bounds writes and potential
|
||||
code execution. Very large memory allocations can still lead to
|
||||
a denial of service. <xref
|
||||
linkend="sect-Defensive_Coding-Tasks-Serialization-Decoders"/>
|
||||
contains suggestions for mitigating this problem when processing
|
||||
untrusted data.
|
||||
</para>
|
||||
<para>
|
||||
See <xref linkend="sect-Defensive_Coding-C-Allocators-Arrays"/>
|
||||
for array allocation advice for C-style memory allocation.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section>
|
||||
<title>Overloading</title>
|
||||
<para>
|
||||
Do not overload functions with versions that have different
|
||||
security characteristics. For instance, do not implement a
|
||||
function <function>strcat</function> which works on
|
||||
<type>std::string</type> arguments. Similarly, do not name
|
||||
methods after such functions.
|
||||
</para>
|
||||
</section>
|
||||
<section>
|
||||
<title>ABI compatibility and preparing for security updates</title>
|
||||
<para>
|
||||
A stable binary interface (ABI) is vastly preferred for security
|
||||
updates. Without a stable ABI, all reverse dependencies need
|
||||
recompiling, which can be a lot of work and could even be
|
||||
impossible in some cases. Ideally, a security update only
|
||||
updates a single dynamic shared object, and is picked up
|
||||
automatically after restarting affected processes.
|
||||
</para>
|
||||
<para>
|
||||
Outside of extremely performance-critical code, you should
|
||||
ensure that a wide range of changes is possible without breaking
|
||||
ABI. Some very basic guidelines are:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
Avoid inline functions.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Use the pointer-to-implementation idiom.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Try to avoid templates. Use them if the increased type
|
||||
safety provides a benefit to the programmer.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Move security-critical code out of templated code, so that
|
||||
it can be patched in a central place if necessary.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
The KDE project publishes a document with more extensive
|
||||
guidelines on ABI-preserving changes to C++ code, <ulink
|
||||
url="http://techbase.kde.org/Policies/Binary_Compatibility_Issues_With_C++">Policies/Binary
|
||||
Compatibility Issues With C++</ulink>
|
||||
(<emphasis>d-pointer</emphasis> refers to the
|
||||
pointer-to-implementation idiom).
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-CXX-Language-CXX11">
|
||||
<title>C++0X and C++11 Support</title>
|
||||
<para>
|
||||
GCC offers different language compatibility modes:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
<option>-std=c++98</option> for the original 1998 C++
|
||||
standard
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<option>-std=c++03</option> for the 1998 standard with the
|
||||
changes from the TR1 technical report
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<option>-std=c++11</option> for the 2011 C++ standard. This
|
||||
option should not be used.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<option>-std=c++0x</option> for several different versions
|
||||
of C++11 support in development, depending on the GCC
|
||||
version. This option should not be used.
|
||||
<!-- There were two incompatibilies before GCC 4.7.2
|
||||
(std::list and std::pair), but link C++98 and C++11
|
||||
code is still unsupported, although it currently has
|
||||
some chance of working by accident. -->
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
For each of these flags, there are variants which also enable
|
||||
GNU extensions (mostly language features also found in C99 or
|
||||
C11): <option>-std=gnu++98</option>,
|
||||
<option>-std=gnu++03</option>, <option>-std=gnu++11</option>.
|
||||
Again, <option>-std=gnu++11</option> should not be used.
|
||||
</para>
|
||||
<para>
|
||||
If you enable C++11 support, the ABI of the standard C++ library
|
||||
<literal>libstdc++</literal> will change in subtle ways.
|
||||
Currently, no C++ libraries are compiled in C++11 mode, so if
|
||||
you compile your code in C++11 mode, it will be incompatible
|
||||
with the rest of the system. Unfortunately, this is also the
|
||||
case if you do not use any C++11 features. Currently, there is
|
||||
no safe way to enable C++11 mode (except for freestanding
|
||||
applications).
|
||||
</para>
|
||||
<para>
|
||||
The meaning of C++0X mode changed from GCC release to GCC
|
||||
release. Earlier versions were still ABI-compatible with C++98
|
||||
mode, but in the most recent versions, switching to C++0X mode
|
||||
activates C++11 support, with its compatibility problems.
|
||||
</para>
|
||||
<para>
|
||||
Some C++11 features (or approximations thereof) are available
|
||||
with TR1 support, that is, with <option>-std=c++03</option> or
|
||||
<option>-std=gnu++03</option> and in the
|
||||
<literal><tr1/*></literal> header files. This includes
|
||||
<literal>std::tr1::shared_ptr</literal> (from
|
||||
<literal><tr1/memory></literal>) and
|
||||
<literal>std::tr1::function</literal> (from
|
||||
<literal><tr1/functional></literal>). For other C++11
|
||||
features, the Boost C++ library contains replacements.
|
||||
</para>
|
||||
</section>
|
||||
</section>
|
||||
|
|
@ -1,202 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE section PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<section id="sect-Defensive_Coding-CXX-Std">
|
||||
<title>The C++ Standard Library</title>
|
||||
<para>
|
||||
The C++ standard library includes most of its C counterpart
|
||||
by reference, see <xref linkend="sect-Defensive_Coding-C-Libc"/>.
|
||||
</para>
|
||||
<section id="sect-Defensive_Coding-CXX-Std-Functions">
|
||||
<title>Functions That Are Difficult to Use</title>
|
||||
<para>
|
||||
This section collects functions and function templates which are
|
||||
part of the standard library and are difficult to use.
|
||||
</para>
|
||||
<section id="sect-Defensive_Coding-CXX-Std-Functions-Unpaired_Iterators">
|
||||
<title>Unpaired Iterators</title>
|
||||
<para>
|
||||
Functions which use output operators or iterators which do not
|
||||
come in pairs (denoting ranges) cannot perform iterator range
|
||||
checking.
|
||||
(See <xref linkend="sect-Defensive_Coding-CXX-Std-Iterators"/>)
|
||||
Function templates which involve output iterators are
|
||||
particularly dangerous:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem><para><function>std::copy</function></para></listitem>
|
||||
<listitem><para><function>std::copy_backward</function></para></listitem>
|
||||
<listitem><para><function>std::copy_if</function></para></listitem>
|
||||
<listitem><para><function>std::move</function> (three-argument variant)</para></listitem>
|
||||
<listitem><para><function>std::move_backward</function></para></listitem>
|
||||
<listitem><para><function>std::partition_copy_if</function></para></listitem>
|
||||
<listitem><para><function>std::remove_copy</function></para></listitem>
|
||||
<listitem><para><function>std::remove_copy_if</function></para></listitem>
|
||||
<listitem><para><function>std::replace_copy</function></para></listitem>
|
||||
<listitem><para><function>std::replace_copy_if</function></para></listitem>
|
||||
<listitem><para><function>std::swap_ranges</function></para></listitem>
|
||||
<listitem><para><function>std::transform</function></para></listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
In addition, <function>std::copy_n</function>,
|
||||
<function>std::fill_n</function> and
|
||||
<function>std::generate_n</function> do not perform iterator
|
||||
checking, either, but there is an explicit count which has to be
|
||||
supplied by the caller, as opposed to an implicit length
|
||||
indicator in the form of a pair of forward iterators.
|
||||
</para>
|
||||
<para>
|
||||
These output-iterator-expecting functions should only be used
|
||||
with unlimited-range output iterators, such as iterators
|
||||
obtained with the <function>std::back_inserter</function>
|
||||
function.
|
||||
</para>
|
||||
<para>
|
||||
Other functions use single input or forward iterators, which can
|
||||
read beyond the end of the input range if the caller is not careful:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem><para><function>std::equal</function></para></listitem>
|
||||
<listitem><para><function>std::is_permutation</function></para></listitem>
|
||||
<listitem><para><function>std::mismatch</function></para></listitem>
|
||||
</itemizedlist>
|
||||
</section>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-CXX-Std-String">
|
||||
<title>String Handling with <literal>std::string</literal></title>
|
||||
<para>
|
||||
The <literal>std::string</literal> class provides a convenient
|
||||
way to handle strings. Unlike C strings,
|
||||
<literal>std::string</literal> objects have an explicit length
|
||||
(and can contain embedded NUL characters), and storage for its
|
||||
characters is managed automatically. This section discusses
|
||||
<literal>std::string</literal>, but these observations also
|
||||
apply to other instances of the
|
||||
<literal>std::basic_string</literal> template.
|
||||
</para>
|
||||
<para>
|
||||
The pointer returned by the <function>data()</function> member
|
||||
function does not necessarily point to a NUL-terminated string.
|
||||
To obtain a C-compatible string pointer, use
|
||||
<function>c_str()</function> instead, which adds the NUL
|
||||
terminator.
|
||||
</para>
|
||||
<para>
|
||||
The pointers returned by the <function>data()</function> and
|
||||
<function>c_str()</function> functions and iterators are only
|
||||
valid until certain events happen. It is required that the
|
||||
exact <literal>std::string</literal> object still exists (even
|
||||
if it was initially created as a copy of another string object).
|
||||
Pointers and iterators are also invalidated when non-const
|
||||
member functions are called, or functions with a non-const
|
||||
reference parameter. The behavior of the GCC implementation
|
||||
deviates from that required by the C++ standard if multiple
|
||||
threads are present. In general, only the first call to a
|
||||
non-const member function after a structural modification of the
|
||||
string (such as appending a character) is invalidating, but this
|
||||
also applies to member function such as the non-const version of
|
||||
<function>begin()</function>, in violation of the C++ standard.
|
||||
</para>
|
||||
<para>
|
||||
Particular care is necessary when invoking the
|
||||
<function>c_str()</function> member function on a temporary
|
||||
object. This is convenient for calling C functions, but the
|
||||
pointer will turn invalid as soon as the temporary object is
|
||||
destroyed, which generally happens when the outermost expression
|
||||
enclosing the expression on which <function>c_str()</function>
|
||||
is called completes evaluation. Passing the result of
|
||||
<function>c_str()</function> to a function which does not store
|
||||
or otherwise leak that pointer is safe, though.
|
||||
</para>
|
||||
<para>
|
||||
Like with <literal>std::vector</literal> and
|
||||
<literal>std::array</literal>, subscribing with
|
||||
<literal>operator[]</literal> does not perform bounds checks.
|
||||
Use the <function>at(size_type)</function> member function
|
||||
instead. See <xref
|
||||
linkend="sect-Defensive_Coding-CXX-Std-Subscript"/>.
|
||||
Furthermore, accessing the terminating NUL character using
|
||||
<literal>operator[]</literal> is not possible. (In some
|
||||
implementations, the <literal>c_str()</literal> member function
|
||||
writes the NUL character on demand.)
|
||||
</para>
|
||||
<para>
|
||||
Never write to the pointers returned by
|
||||
<function>data()</function> or <function>c_str()</function>
|
||||
after casting away <literal>const</literal>. If you need a
|
||||
C-style writable string, use a
|
||||
<literal>std::vector<char></literal> object and its
|
||||
<function>data()</function> member function. In this case, you
|
||||
have to explicitly add the terminating NUL character.
|
||||
</para>
|
||||
<para>
|
||||
GCC's implementation of <literal>std::string</literal> is
|
||||
currently based on reference counting. It is expected that a
|
||||
future version will remove the reference counting, due to
|
||||
performance and conformance issues. As a result, code that
|
||||
implicitly assumes sharing by holding to pointers or iterators
|
||||
for too long will break, resulting in run-time crashes or worse.
|
||||
On the other hand, non-const iterator-returning functions will
|
||||
no longer give other threads an opportunity for invalidating
|
||||
existing iterators and pointers because iterator invalidation
|
||||
does not depend on sharing of the internal character array
|
||||
object anymore.
|
||||
</para>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-CXX-Std-Subscript">
|
||||
<title>Containers and <literal>operator[]</literal></title>
|
||||
<para>
|
||||
Many sequence containers similar to <literal>std::vector</literal>
|
||||
provide both <literal>operator[](size_type)</literal> and a
|
||||
member function <literal>at(size_type)</literal>. This applies
|
||||
to <literal>std::vector</literal> itself,
|
||||
<literal>std::array</literal>, <literal>std::string</literal>
|
||||
and other instances of <literal>std::basic_string</literal>.
|
||||
</para>
|
||||
<para>
|
||||
<literal>operator[](size_type)</literal> is not required by the
|
||||
standard to perform bounds checking (and the implementation in
|
||||
GCC does not). In contrast, <literal>at(size_type)</literal>
|
||||
must perform such a check. Therefore, in code which is not
|
||||
performance-critical, you should prefer
|
||||
<literal>at(size_type)</literal> over
|
||||
<literal>operator[](size_type)</literal>, even though it is
|
||||
slightly more verbose.
|
||||
</para>
|
||||
<para>
|
||||
The <literal>front()</literal> and <literal>back()</literal>
|
||||
member functions are undefined if a vector object is empty. You
|
||||
can use <literal>vec.at(0)</literal> and
|
||||
<literal>vec.at(vec.size() - 1)</literal> as checked
|
||||
replacements. For an empty vector, <literal>data()</literal> is
|
||||
defined; it returns an arbitrary pointer, but not necessarily
|
||||
the NULL pointer.
|
||||
</para>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-CXX-Std-Iterators">
|
||||
<title>Iterators</title>
|
||||
<para>
|
||||
Iterators do not perform any bounds checking. Therefore, all
|
||||
functions that work on iterators should accept them in pairs,
|
||||
denoting a range, and make sure that iterators are not moved
|
||||
outside that range. For forward iterators and bidirectional
|
||||
iterators, you need to check for equality before moving the
|
||||
first or last iterator in the range. For random-access
|
||||
iterators, you need to compute the difference before adding or
|
||||
subtracting an offset. It is not possible to perform the
|
||||
operation and check for an invalid operator afterwards.
|
||||
</para>
|
||||
<para>
|
||||
Output iterators cannot be compared for equality. Therefore, it
|
||||
is impossible to write code that detects that it has been
|
||||
supplied an output area that is too small, and their use should
|
||||
be avoided.
|
||||
</para>
|
||||
<para>
|
||||
These issues make some of the standard library functions
|
||||
difficult to use correctly, see <xref
|
||||
linkend="sect-Defensive_Coding-CXX-Std-Functions-Unpaired_Iterators"/>.
|
||||
</para>
|
||||
</section>
|
||||
</section>
|
||||
|
|
@ -1,10 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE chapter PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<chapter id="chap-Defensive_Coding-CXX">
|
||||
<title>The C++ Programming Language</title>
|
||||
|
||||
<xi:include href="CXX-Language.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="CXX-Std.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</chapter>
|
||||
|
|
@ -1,2 +0,0 @@
|
|||
<!ENTITY YEAR "2012-2017">
|
||||
<!ENTITY HOLDER "Red Hat, Inc">
|
|
@ -1,33 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE book PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd">
|
||||
<book>
|
||||
<xi:include href="Book_Info.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<part>
|
||||
<title>Programming Languages</title>
|
||||
<xi:include href="C.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="CXX.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="Java.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="Python.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="Shell.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="Go.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="Vala.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</part>
|
||||
<part>
|
||||
<title>Specific Programming Tasks</title>
|
||||
<xi:include href="Tasks-Library_Design.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="Tasks-Descriptors.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="Tasks-File_System.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="Tasks-Temporary_Files.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="Tasks-Processes.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="Tasks-Serialization.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="Tasks-Cryptography.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="Tasks-Packaging.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</part>
|
||||
<part>
|
||||
<title>Implementing Security Features</title>
|
||||
<xi:include href="Features-Authentication.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="Features-TLS.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="Features-HSM.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</part>
|
||||
<xi:include href="Revision_History.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</book>
|
|
@ -1,189 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE chapter PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<chapter id="chap-Defensive_Coding-Authentication">
|
||||
<title>Authentication and Authorization</title>
|
||||
|
||||
<section id="sect-Defensive_Coding-Authentication-Server">
|
||||
<title>Authenticating Servers</title>
|
||||
<para>
|
||||
When connecting to a server, a client has to make sure that it
|
||||
is actually talking to the server it expects. There are two
|
||||
different aspects, securing the network path, and making sure
|
||||
that the expected user runs the process on the target host.
|
||||
There are several ways to ensure that:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
The server uses a TLS certificate which is valid according
|
||||
to the web browser public key infrastructure, and the client
|
||||
verifies the certificate and the host name.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The server uses a TLS certificate which is expected by the
|
||||
client (perhaps it is stored in a configuration file read by
|
||||
the client). In this case, no host name checking is
|
||||
required.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
On Linux, UNIX domain sockets (of the
|
||||
<literal>PF_UNIX</literal> protocol family, sometimes called
|
||||
<literal>PF_LOCAL</literal>) are restricted by file system
|
||||
permissions. If the server socket path is not
|
||||
world-writable, the server identity cannot be spoofed by
|
||||
local users.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Port numbers less than 1024 (<emphasis>trusted
|
||||
ports</emphasis>) can only be used by
|
||||
<literal>root</literal>, so if a UDP or TCP server is
|
||||
running on the local host and it uses a trusted port, its
|
||||
identity is assured. (Not all operating systems enforce the
|
||||
trusted ports concept, and the network might not be trusted,
|
||||
so it is only useful on the local system.)
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
TLS (<xref linkend="chap-Defensive_Coding-TLS"/>) is the
|
||||
recommended way for securing connections over untrusted
|
||||
networks.
|
||||
</para>
|
||||
<para>
|
||||
If the server port number is 1024 is higher, a local user can
|
||||
impersonate the process by binding to this socket, perhaps after
|
||||
crashing the real server by exploiting a denial-of-service
|
||||
vulnerability.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Authentication-Host_based">
|
||||
<title>Host-based Authentication</title>
|
||||
<para>
|
||||
Host-based authentication uses access control lists (ACLs) to
|
||||
accept or deny requests from clients. This authentication
|
||||
method comes in two flavors: IP-based (or, more generally,
|
||||
address-based) and name-based (with the name coming from DNS or
|
||||
<filename>/etc/hosts</filename>). IP-based ACLs often use
|
||||
prefix notation to extend access to entire subnets. Name-based
|
||||
ACLs sometimes use wildcards for adding groups of hosts (from
|
||||
entire DNS subtrees). (In the SSH context, host-based
|
||||
authentication means something completely different and is not
|
||||
covered in this section.)
|
||||
</para>
|
||||
<para>
|
||||
Host-based authentication trust the network and may not offer
|
||||
sufficient granularity, so it has to be considered a weak form
|
||||
of authentication. On the other hand, IP-based authentication
|
||||
can be made extremely robust and can be applied very early in
|
||||
input processing, so it offers an opportunity for significantly
|
||||
reducing the number of potential attackers for many services.
|
||||
</para>
|
||||
<para>
|
||||
The names returned by <function>gethostbyaddr</function> and
|
||||
<function>getnameinfo</function> functions cannot be trusted.
|
||||
(DNS PTR records can be set to arbitrary values, not just names
|
||||
belong to the address owner.) If these names are used for ACL
|
||||
matching, a forward lookup using
|
||||
<function>gethostbyaddr</function> or
|
||||
<function>getaddrinfo</function> has to be performed. The name
|
||||
is only valid if the original address is found among the results
|
||||
of the forward lookup (<emphasis>double-reverse
|
||||
lookup</emphasis>).
|
||||
</para>
|
||||
<para>
|
||||
An empty ACL should deny all access (deny-by-default). If empty
|
||||
ACLs permits all access, configuring any access list must switch
|
||||
to deny-by-default for all unconfigured protocols, in both
|
||||
name-based and address-based variants.
|
||||
</para>
|
||||
<para>
|
||||
Similarly, if an address or name is not matched by the list, it
|
||||
should be denied. However, many implementations behave
|
||||
differently, so the actual behavior must be documented properly.
|
||||
</para>
|
||||
<para>
|
||||
IPv6 addresses can embed IPv4 addresses. There is no
|
||||
universally correct way to deal with this ambiguity. The
|
||||
behavior of the ACL implementation should be documented.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Authentication-UNIX_Domain">
|
||||
<title>UNIX Domain Socket Authentication</title>
|
||||
<para>
|
||||
UNIX domain sockets (with address family
|
||||
<literal>AF_UNIX</literal> or <literal>AF_LOCAL</literal>) are
|
||||
restricted to the local host and offer a special authentication
|
||||
mechanism: credentials passing.
|
||||
</para>
|
||||
<para>
|
||||
Nowadays, most systems support the
|
||||
<literal>SO_PEERCRED</literal> (Linux) or
|
||||
<literal>LOCAL_PEERCRED</literal> (FreeBSD) socket options, or
|
||||
the <function>getpeereid</function> (other BSDs, OS X).
|
||||
These interfaces provide direct access to the (effective) user
|
||||
ID on the other end of a domain socket connect, without
|
||||
cooperation from the other end.
|
||||
</para>
|
||||
<para>
|
||||
Historically, credentials passing was implemented using
|
||||
ancillary data in the <function>sendmsg</function> and
|
||||
<function>recvmsg</function> functions. On some systems, only
|
||||
credentials data that the peer has explicitly sent can be
|
||||
received, and the kernel checks the data for correctness on the
|
||||
sending side. This means that both peers need to deal with
|
||||
ancillary data. Compared to that, the modern interfaces are
|
||||
easier to use. Both sets of interfaces vary considerably among
|
||||
UNIX-like systems, unfortunately.
|
||||
</para>
|
||||
<para>
|
||||
If you want to authenticate based on supplementary groups, you
|
||||
should obtain the user ID using one of these methods, and look
|
||||
up the list of supplementary groups using
|
||||
<function>getpwuid</function> (or
|
||||
<function>getpwuid_r</function>) and
|
||||
<function>getgrouplist</function>. Using the PID and
|
||||
information from <filename>/proc/PID/status</filename> is prone
|
||||
to race conditions and insecure.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Authentication-Netlink">
|
||||
<title><literal>AF_NETLINK</literal> Authentication of Origin</title>
|
||||
<!-- ??? kernel change may make this obsolete:
|
||||
https://bugzilla.redhat.com/show_bug.cgi?id=851968 -->
|
||||
<para>
|
||||
Netlink messages are used as a high-performance data transfer
|
||||
mechanism between the kernel and the user space. Traditionally,
|
||||
they are used to exchange information related to the network
|
||||
stack, such as routing table entries.
|
||||
</para>
|
||||
<para>
|
||||
When processing Netlink messages from the kernel, it is
|
||||
important to check that these messages actually originate from
|
||||
the kernel, by checking that the port ID (or PID) field
|
||||
<literal>nl_pid</literal> in the <literal>sockaddr_nl</literal>
|
||||
structure is <literal>0</literal>. (This structure can be
|
||||
obtained using <function>recvfrom</function> or
|
||||
<function>recvmsg</function>, it is different from the
|
||||
<literal>nlmsghdr</literal> structure.) The kernel does not
|
||||
prevent other processes from sending unicast Netlink messages,
|
||||
but the <literal>nl_pid</literal> field in the sender's socket
|
||||
address will be non-zero in such cases.
|
||||
</para>
|
||||
<para>
|
||||
Applications should not use <literal>AF_NETLINK</literal>
|
||||
sockets as an IPC mechanism among processes, but prefer UNIX
|
||||
domain sockets for this tasks.
|
||||
</para>
|
||||
</section>
|
||||
</chapter>
|
||||
|
|
@ -1,180 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE chapter PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<chapter id="chap-Defensive_Coding-HSM">
|
||||
<title>Hardware Security Modules and Smart Cards</title>
|
||||
<para>
|
||||
Hardware Security Modules (HSMs) are specialized hardware intended
|
||||
to protect private keys on server systems. They store internally
|
||||
the private keys (e.g., RSA keys), and provide access to operations
|
||||
with the keys without exposing the keys. That access, is provided using
|
||||
a standardized API, which across Fedora is PKCS#11.
|
||||
</para>
|
||||
<para>
|
||||
Smart cards are small cards with a micro processor, often combined with a
|
||||
USB reader resembling a USB stick. They are very similar in nature with
|
||||
HSMs as they can also be used to protect private keys and are almost
|
||||
universally accessed via the PKCS#11 API. The main distinguishers from HSMs
|
||||
is their inferior performance and often, the available hardware protection mechanisms.
|
||||
</para>
|
||||
<para>
|
||||
Typically a smart card or HSM relies on a shared library to provide functionality.
|
||||
This shared library follows the PKCS#11 API and thus is often referred to as
|
||||
a PKCS#11 module. In Fedora the <literal>opensc</literal>
|
||||
shared module (<literal>opensc-pkcs11.so</literal>) can be used for the majority
|
||||
of smart cards available in the market. By convention these modules are located
|
||||
at <literal>/usr/lib64/pkcs11</literal>. They can be used directly, or via
|
||||
a higher level library.
|
||||
</para>
|
||||
<para>
|
||||
All the major crypto libraries (NSS, GnuTLS and OpenSSL in Fedora) support
|
||||
hardware security modules and smart cards, by providing wrappers over the
|
||||
PKCS#11 API. However, the level of support varies, as well as the ease of
|
||||
use of such modules and its integration to the overall library API.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
The PKCS#11 API does provide an API to access HSMs or smart cards, but
|
||||
does not provide any method of discovering which HSMs or smart cards are
|
||||
available in the system. In Fedora and modules are registered via <ulink url="https://p11-glue.freedesktop.org/doc/p11-kit/pkcs11-conf.html">p11-kit
|
||||
configuration files</ulink>, stored at <literal>/etc/pkcs11/modules/</literal>. For applications using
|
||||
<literal>engine_pkcs11</literal> or GnuTLS the registered modules are
|
||||
available without further configuration. Other applications will have to load
|
||||
the <literal>p11-kit-proxy.so</literal> module.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Most crypto libraries support the <ulink url="https://tools.ietf.org/html/rfc7512">PKCS#11 URLs scheme</ulink>
|
||||
to identify objects stored in an HSM, however that support is not yet universal.
|
||||
Some support transparent usage of PKCS#11 objects, e.g., specifying
|
||||
a PKCS#11 object instead of a file, while others require to use
|
||||
specialized APIs for such objects.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Objects stored in an HSM or smart card can be protected with a PIN. As such,
|
||||
libraries typically require to set a PIN handling function for accessing private keys,
|
||||
or the PIN can be passed along with a PKCS#11 URL and the pin-value parameter.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Obtaining a Hardware Security Module, or including it on a continuous integration
|
||||
testing is not always feasible. For testing purposes smart cards supported by the OpenSC
|
||||
project can be used, as well as software modules like <literal>softhsm</literal> which
|
||||
provides a tool to setup a software HSM, and a PKCS#11 library.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The PKCS#11 API requires applications that use fork to reinitialize the used PKCS#11
|
||||
modules. This is an uncommon requirement, which has led to several bugs across
|
||||
applications in Fedora which used PKCS#11 directly. To make things more complicated
|
||||
software PKCS#11 module like <literal>softhsm</literal> do not require this re-initialization
|
||||
leading to applications working against software modules but failing with hardware
|
||||
modules or smart cards. The wrapper PKCS#11 APIs provided by NSS, GNUTLS and
|
||||
engine_pkcs11 (OpenSSL) handle the reinitialization after fork requirement transparently.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<section id="sect-Defensive_Coding-HSM-OpenSSL">
|
||||
<title>OpenSSL HSM Support</title>
|
||||
<para>
|
||||
OpenSSL does not have native support for PKCS#11. It can
|
||||
provide PKCS#11 support through the OpenSC's project
|
||||
<literal>pkcs11</literal> engine (formerly known as <literal>engine_pkcs11</literal>).
|
||||
As such software intended to use HSMs, must utilize that engine.
|
||||
</para>
|
||||
<para>
|
||||
Engine <literal>pkcs11</literal> supports loading stored objects via PKCS#11 URLs.
|
||||
If no PKCS#11 module is specified the engine will use the system-wide registered
|
||||
modules via <literal>p11-kit-proxy.so</literal>.
|
||||
</para>
|
||||
<para>
|
||||
The following example demonstrates the initialization of the pkcs11 engine
|
||||
and its usage to sign data.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-HSM-OpenSSL">
|
||||
<title>Signing data with HSM and OpenSSL</title>
|
||||
<xi:include href="snippets/Features-HSM-OpenSSL.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-HSM-GNUTLS">
|
||||
<title>GNUTLS HSM Support</title>
|
||||
<para>
|
||||
GNUTLS supports PKCS#11 natively. Most of the API functions
|
||||
accepting certificate files, can also accept PKCS#11 URLs, thus
|
||||
requiring minor or no modifications to applications in order
|
||||
to support HSMs. In most cases applications must be modified
|
||||
to install a PIN callback function.
|
||||
</para>
|
||||
<para>
|
||||
The following example demonstrates the initialization of the pkcs11 engine
|
||||
and its usage to sign data.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-HSM-GNUTLS">
|
||||
<title>Signing data with HSM and GnuTLS</title>
|
||||
<xi:include href="snippets/Features-HSM-GNUTLS.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
The PIN callback function can be either set globally as in
|
||||
the example above or locally by utilizing functions such as <literal>gnutls_privkey_set_pin_function</literal>.
|
||||
An example PIN callback function is shown below.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-HSM-GNUTLS-PIN">
|
||||
<title>An example PIN callback with GNUTLS</title>
|
||||
<xi:include href="snippets/Features-HSM-GNUTLS-PIN.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-HSM-NSS">
|
||||
<title>NSS HSM Support</title>
|
||||
<para>
|
||||
NSS supports PKCS#11 natively. In fact all NSS crypto operations,
|
||||
including built-in operations, go through PKCS #11 modules. NSS provides
|
||||
its own software PKCS #11 module called softoken. NSS automatically
|
||||
loads any PKCS #11 module specified in its module database, which can
|
||||
be manipulated with the modutil command. NSS uses the PKCS #11 module
|
||||
that contains the requested keys to do the crypto operations. As long as
|
||||
the application opens an NSS database and properly sets a pin callback. If
|
||||
it runs with native NSS, it should be able to use HSMs that provide PKCS #11
|
||||
modules. Modules can also be loaded programatically, though this is less common.
|
||||
</para>
|
||||
<!-- loaded programatically = loaded automatically? -->
|
||||
<para>
|
||||
The following example demonstrates a typical NSS application for signing.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-HSM-NSS">
|
||||
<title>Signing data with HSM and NSS</title>
|
||||
<xi:include href="snippets/Features-HSM-NSS.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
To use the example above with an HSM or smart card you will need to do the following.
|
||||
</para>
|
||||
<informalexample>
|
||||
<programlisting language="Bash">
|
||||
# add your HSM or token library to an NSS database (in the sample code the database is
|
||||
# located in the current directory'.')
|
||||
$ modutil -add "My HSM" -libfile ${path_to_pkcs11_file} -dbdir .
|
||||
# Find the token name on your HSM
|
||||
$ modutil -list -dbdir .
|
||||
# find the cert on your token
|
||||
$ certutil -L -h ${token_name} -d .
|
||||
# pass the cert to your signing program
|
||||
$ NSS_Sign_Example "${token_name}:${cert_name}"
|
||||
</programlisting>
|
||||
</informalexample>
|
||||
<example id="ex-Defensive_Coding-HSM-NSS-PIN">
|
||||
<title>An example PIN callback with NSS</title>
|
||||
<xi:include href="snippets/Features-HSM-NSS-PIN.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
</section>
|
||||
</chapter>
|
|
@ -1,941 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE chapter PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<chapter id="chap-Defensive_Coding-TLS">
|
||||
<title>Transport Layer Security (TLS)</title>
|
||||
<para>
|
||||
Transport Layer Security (TLS, formerly Secure Sockets
|
||||
Layer/SSL) is the recommended way to to protect integrity and
|
||||
confidentiality while data is transferred over an untrusted
|
||||
network connection, and to identify the endpoint. At this
|
||||
chapter we describe the available libraries in Fedora as well
|
||||
as known pitfalls, and safe ways to write applications with them.
|
||||
</para>
|
||||
<para>
|
||||
When using any library, in addition to this guide, it is recommended to consult the
|
||||
library' documentation.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem><para><ulink url="https://developer.mozilla.org/en-US/docs/Mozilla/Projects/NSS">NSS documentation</ulink></para></listitem>
|
||||
<listitem><para><ulink url="http://www.gnutls.org/manual/">GNUTLS documentation</ulink></para></listitem>
|
||||
<listitem><para><ulink url="https://www.openssl.org/docs/">OpenSSL documentation</ulink></para></listitem>
|
||||
<listitem><para><ulink url="https://docs.oracle.com/javase/8/docs/technotes/guides/security/jsse/JSSERefGuide.html">OpenJDK documentation</ulink></para></listitem>
|
||||
</itemizedlist>
|
||||
<section id="sect-Defensive_Coding-TLS-Pitfalls">
|
||||
<title>Common Pitfalls</title>
|
||||
<para>
|
||||
TLS implementations are difficult to use, and most of them lack
|
||||
a clean API design. The following sections contain
|
||||
implementation-specific advice, and some generic pitfalls are
|
||||
mentioned below.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
Most TLS implementations have questionable default TLS
|
||||
cipher suites. Most of them enable anonymous Diffie-Hellman
|
||||
key exchange (but we generally want servers to authenticate
|
||||
themselves). Many do not disable ciphers which are subject
|
||||
to brute-force attacks because of restricted key lengths.
|
||||
Some even disable all variants of AES in the default
|
||||
configuration.
|
||||
</para>
|
||||
<para>
|
||||
When overriding the cipher suite defaults, it is recommended
|
||||
to disable all cipher suites which are not present on a
|
||||
whitelist, instead of simply enabling a list of cipher
|
||||
suites. This way, if an algorithm is disabled by default in
|
||||
the TLS implementation in a future security update, the
|
||||
application will not re-enable it.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The name which is used in certificate validation must match
|
||||
the name provided by the user or configuration file. No host
|
||||
name canonicalization or IP address lookup must be performed.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The TLS handshake has very poor performance if the TCP Nagle
|
||||
algorithm is active. You should switch on the
|
||||
<literal>TCP_NODELAY</literal> socket option (at least for the
|
||||
duration of the handshake), or use the Linux-specific
|
||||
<literal>TCP_CORK</literal> option.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-Nagle">
|
||||
<title>Deactivating the TCP Nagle algorithm</title>
|
||||
<xi:include href="snippets/Features-TLS-Nagle.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Implementing proper session resumption decreases handshake
|
||||
overhead considerably. This is important if the upper-layer
|
||||
protocol uses short-lived connections (like most application
|
||||
of HTTPS).
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Both client and server should work towards an orderly
|
||||
connection shutdown, that is send
|
||||
<literal>close_notify</literal> alerts and respond to them.
|
||||
This is especially important if the upper-layer protocol
|
||||
does not provide means to detect connection truncation (like
|
||||
some uses of HTTP).
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
When implementing a server using event-driven programming,
|
||||
it is important to handle the TLS handshake properly because
|
||||
it includes multiple network round-trips which can block
|
||||
when an ordinary TCP <function>accept</function> would not.
|
||||
Otherwise, a client which fails to complete the TLS
|
||||
handshake for some reason will prevent the server from
|
||||
handling input from other clients.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Unlike regular file descriptors, TLS connections cannot be
|
||||
passed between processes. Some TLS implementations add
|
||||
additional restrictions, and TLS connections generally
|
||||
cannot be used across <function>fork</function> function
|
||||
calls (see <xref
|
||||
linkend="sect-Defensive_Coding-Tasks-Processes-Fork-Parallel"/>).
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<section id="sect-Defensive_Coding-TLS-OpenSSL">
|
||||
<title>OpenSSL Pitfalls</title>
|
||||
<para>
|
||||
Some OpenSSL function use <emphasis>tri-state return
|
||||
values</emphasis>. Correct error checking is extremely
|
||||
important. Several functions return <literal>int</literal>
|
||||
values with the following meaning:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
The value <literal>1</literal> indicates success (for
|
||||
example, a successful signature verification).
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The value <literal>0</literal> indicates semantic
|
||||
failure (for example, a signature verification which was
|
||||
unsuccessful because the signing certificate was
|
||||
self-signed).
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The value <literal>-1</literal> indicates a low-level
|
||||
error in the system, such as failure to allocate memory
|
||||
using <function>malloc</function>.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
Treating such tri-state return values as booleans can lead
|
||||
to security vulnerabilities. Note that some OpenSSL
|
||||
functions return boolean results or yet another set of
|
||||
status indicators. Each function needs to be checked
|
||||
individually.
|
||||
</para>
|
||||
<para>
|
||||
Recovering precise error information is difficult.
|
||||
<xref linkend="ex-Defensive_Coding-TLS-OpenSSL-Errors"/>
|
||||
shows how to obtain a more precise error code after a function
|
||||
call on an <literal>SSL</literal> object has failed. However,
|
||||
there are still cases where no detailed error information is
|
||||
available (e.g., if <function>SSL_shutdown</function> fails
|
||||
due to a connection teardown by the other end).
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-OpenSSL-Errors">
|
||||
<title>Obtaining OpenSSL error codes</title>
|
||||
<xi:include href="snippets/Features-TLS-OpenSSL-Errors.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
The <function>OPENSSL_config</function> function is
|
||||
documented to never fail. In reality, it can terminate the
|
||||
entire process if there is a failure accessing the
|
||||
configuration file. An error message is written to standard
|
||||
error, but which might not be visible if the function is
|
||||
called from a daemon process.
|
||||
</para>
|
||||
<para>
|
||||
OpenSSL contains two separate ASN.1 DER decoders. One set
|
||||
of decoders operate on BIO handles (the input/output stream
|
||||
abstraction provided by OpenSSL); their decoder function
|
||||
names start with <literal>d2i_</literal> and end in
|
||||
<literal>_fp</literal> or <literal>_bio</literal> (e.g.,
|
||||
<function>d2i_X509_fp</function> or
|
||||
<function>d2i_X509_bio</function>). These decoders must not
|
||||
be used for parsing data from untrusted sources; instead,
|
||||
the variants without the <literal>_fp</literal> and
|
||||
<literal>_bio</literal> (e.g.,
|
||||
<function>d2i_X509</function>) shall be used. The BIO
|
||||
variants have received considerably less testing and are not
|
||||
very robust.
|
||||
</para>
|
||||
<para>
|
||||
For the same reason, the OpenSSL command line tools (such as
|
||||
<command>openssl x509</command>) are generally generally less
|
||||
robust than the actual library code. They use the BIO
|
||||
functions internally, and not the more robust variants.
|
||||
</para>
|
||||
<para>
|
||||
The command line tools do not always indicate failure in the
|
||||
exit status of the <application>openssl</application> process.
|
||||
For instance, a verification failure in <command>openssl
|
||||
verify</command> result in an exit status of zero.
|
||||
</para>
|
||||
<para>
|
||||
OpenSSL command-line commands, such as <command>openssl
|
||||
genrsa</command>, do not ensure that physical entropy is used
|
||||
for key generation—they obtain entropy from
|
||||
<filename>/dev/urandom</filename> and other sources, but not
|
||||
from <filename>/dev/random</filename>. This can result in
|
||||
weak keys if the system lacks a proper entropy source (e.g., a
|
||||
virtual machine with solid state storage). Depending on local
|
||||
policies, keys generated by these OpenSSL tools should not be
|
||||
used in high-value, critical functions.
|
||||
</para>
|
||||
<para>
|
||||
The OpenSSL server and client applications (<command>openssl
|
||||
s_client</command> and <command>openssl s_server</command>)
|
||||
are debugging tools and should <emphasis>never</emphasis> be
|
||||
used as generic clients. For instance, the
|
||||
<application>s_client</application> tool reacts in a
|
||||
surprising way to lines starting with <literal>R</literal> and
|
||||
<literal>Q</literal>.
|
||||
</para>
|
||||
<para>
|
||||
OpenSSL allows application code to access private key
|
||||
material over documented interfaces. This can significantly
|
||||
increase the part of the code base which has to undergo
|
||||
security certification.
|
||||
</para>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-TLS-Pitfalls-GNUTLS">
|
||||
<title>GNUTLS Pitfalls</title>
|
||||
<para>
|
||||
Older versions of GNUTLS had several peculiarities described
|
||||
in previous versions of this guide; as of GNUTLS 3.3.10, these
|
||||
issues are no longer applicable.
|
||||
</para>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-TLS-Pitfalls-OpenJDK">
|
||||
<title>OpenJDK Pitfalls</title>
|
||||
<para>
|
||||
The Java cryptographic framework is highly modular. As a
|
||||
result, when you request an object implementing some
|
||||
cryptographic functionality, you cannot be completely sure
|
||||
that you end up with the well-tested, reviewed implementation
|
||||
in OpenJDK.
|
||||
</para>
|
||||
<para>
|
||||
OpenJDK (in the source code as published by Oracle) and other
|
||||
implementations of the Java platform require that the system
|
||||
administrator has installed so-called <emphasis>unlimited
|
||||
strength jurisdiction policy files</emphasis>. Without this
|
||||
step, it is not possible to use the secure algorithms which
|
||||
offer sufficient cryptographic strength. Most downstream
|
||||
redistributors of OpenJDK remove this requirement.
|
||||
</para>
|
||||
<para>
|
||||
Some versions of OpenJDK use <filename>/dev/random</filename>
|
||||
as the randomness source for nonces and other random data
|
||||
which is needed for TLS operation, but does not actually
|
||||
require physical randomness. As a result, TLS applications
|
||||
can block, waiting for more bits to become available in
|
||||
<filename>/dev/random</filename>.
|
||||
</para>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-TLS-Pitfalls-NSS">
|
||||
<title>NSS Pitfalls</title>
|
||||
<para>
|
||||
NSS was not designed to be used by other libraries which can
|
||||
be linked into applications without modifying them. There is
|
||||
a lot of global state. There does not seem to be a way to
|
||||
perform required NSS initialization without race conditions.
|
||||
</para>
|
||||
<para>
|
||||
If the NSPR descriptor is in an unexpected state, the
|
||||
<function>SSL_ForceHandshake</function> function can succeed,
|
||||
but no TLS handshake takes place, the peer is not
|
||||
authenticated, and subsequent data is exchanged in the clear.
|
||||
</para>
|
||||
<para>
|
||||
NSS disables itself if it detects that the process underwent a
|
||||
<function>fork</function> after the library has been
|
||||
initialized. This behavior is required by the PKCS#11 API
|
||||
specification.
|
||||
</para>
|
||||
</section>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-TLS-Client">
|
||||
<title>TLS Clients</title>
|
||||
<para>
|
||||
Secure use of TLS in a client generally involves all of the
|
||||
following steps. (Individual instructions for specific TLS
|
||||
implementations follow in the next sections.)
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
The client must configure the TLS library to use a set of
|
||||
trusted root certificates. These certificates are provided
|
||||
by the system in various formats and files. These are documented in <literal>update-ca-trust</literal>
|
||||
man page in Fedora. Portable applications should not hard-code
|
||||
any paths; they should rely on APIs which set the default
|
||||
for the system trust store.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The client selects sufficiently strong cryptographic
|
||||
primitives and disables insecure ones (such as no-op
|
||||
encryption). Compression support and SSL version 3 or lower must be
|
||||
disabled (including the SSLv2-compatible handshake).
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The client initiates the TLS connection. The Server Name
|
||||
Indication extension should be used if supported by the
|
||||
TLS implementation. Before switching to the encrypted
|
||||
connection state, the contents of all input and output
|
||||
buffers must be discarded.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The client needs to validate the peer certificate provided
|
||||
by the server, that is, the client must check that there
|
||||
is a cryptographically protected chain from a trusted root
|
||||
certificate to the peer certificate. (Depending on the
|
||||
TLS implementation, a TLS handshake can succeed even if
|
||||
the certificate cannot be validated.)
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The client must check that the configured or user-provided
|
||||
server name matches the peer certificate provided by the
|
||||
server.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
It is safe to provide users detailed diagnostics on
|
||||
certificate validation failures. Other causes of handshake
|
||||
failures and, generally speaking, any details on other errors
|
||||
reported by the TLS implementation (particularly exception
|
||||
tracebacks), must not be divulged in ways that make them
|
||||
accessible to potential attackers. Otherwise, it is possible
|
||||
to create decryption oracles.
|
||||
</para>
|
||||
<important>
|
||||
<para>
|
||||
Depending on the application, revocation checking (against
|
||||
certificate revocations lists or via OCSP) and session
|
||||
resumption are important aspects of production-quality
|
||||
client. These aspects are not yet covered.
|
||||
</para>
|
||||
</important>
|
||||
<section>
|
||||
<title>Implementation TLS Clients With OpenSSL</title>
|
||||
<para>
|
||||
In the following code, the error handling is only exploratory.
|
||||
Proper error handling is required for production use,
|
||||
especially in libraries.
|
||||
<!-- FIXME: Cross-reference event-driven I/O section when it
|
||||
exists and mention that this is really quite complex to
|
||||
implement. -->
|
||||
</para>
|
||||
<para>
|
||||
The OpenSSL library needs explicit initialization (see <xref
|
||||
linkend="ex-Defensive_Coding-TLS-OpenSSL-Init"/>).
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-OpenSSL-Init">
|
||||
<title>OpenSSL library initialization</title>
|
||||
<xi:include href="snippets/Features-TLS-Client-OpenSSL-Init.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
After that, a context object has to be created, which acts as
|
||||
a factory for connection objects (<xref
|
||||
linkend="ex-Defensive_Coding-TLS-Client-OpenSSL-CTX"/>). We
|
||||
use an explicit cipher list so that we do not pick up any
|
||||
strange ciphers when OpenSSL is upgraded. The actual version
|
||||
requested in the client hello depends on additional
|
||||
restrictions in the OpenSSL library. If possible, you should
|
||||
follow the example code and use the default list of trusted
|
||||
root certificate authorities provided by the system because
|
||||
you would have to maintain your own set otherwise, which can
|
||||
be cumbersome.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-Client-OpenSSL-CTX">
|
||||
<title>OpenSSL client context creation</title>
|
||||
<xi:include href="snippets/Features-TLS-Client-OpenSSL-CTX.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
A single context object can be used to create multiple
|
||||
connection objects. It is safe to use the same
|
||||
<literal>SSL_CTX</literal> object for creating connections
|
||||
concurrently from multiple threads, provided that the
|
||||
<literal>SSL_CTX</literal> object is not modified (e.g.,
|
||||
callbacks must not be changed).
|
||||
</para>
|
||||
<para>
|
||||
After creating the TCP socket and disabling the Nagle
|
||||
algorithm (per <xref
|
||||
linkend="ex-Defensive_Coding-TLS-Nagle"/>), the actual
|
||||
connection object needs to be created, as show in <xref
|
||||
linkend="ex-Defensive_Coding-TLS-Client-OpenSSL-CTX"/>. If
|
||||
the handshake started by <function>SSL_connect</function>
|
||||
fails, the <function>ssl_print_error_and_exit</function>
|
||||
function from <xref
|
||||
linkend="ex-Defensive_Coding-TLS-OpenSSL-Errors"/> is called.
|
||||
</para>
|
||||
<para>
|
||||
The <function>certificate_validity_override</function>
|
||||
function provides an opportunity to override the validity of
|
||||
the certificate in case the OpenSSL check fails. If such
|
||||
functionality is not required, the call can be removed,
|
||||
otherwise, the application developer has to implement it.
|
||||
</para>
|
||||
<para>
|
||||
The host name passed to the functions
|
||||
<function>SSL_set_tlsext_host_name</function> and
|
||||
<function>X509_check_host</function> must be the name that was
|
||||
passed to <function>getaddrinfo</function> or a similar name
|
||||
resolution function. No host name canonicalization must be
|
||||
performed. The <function>X509_check_host</function> function
|
||||
used in the final step for host name matching is currently
|
||||
only implemented in OpenSSL 1.1, which is not released yet.
|
||||
In case host name matching fails, the function
|
||||
<function>certificate_host_name_override</function> is called.
|
||||
This function should check user-specific certificate store, to
|
||||
allow a connection even if the host name does not match the
|
||||
certificate. This function has to be provided by the
|
||||
application developer. Note that the override must be keyed
|
||||
by both the certificate <emphasis>and</emphasis> the host
|
||||
name.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-Client-OpenSSL-Connect">
|
||||
<title>Creating a client connection using OpenSSL</title>
|
||||
<xi:include href="snippets/Features-TLS-Client-OpenSSL-Connect.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
The connection object can be used for sending and receiving
|
||||
data, as in <xref
|
||||
linkend="ex-Defensive_Coding-TLS-OpenSSL-Connection-Use"/>.
|
||||
It is also possible to create a <literal>BIO</literal> object
|
||||
and use the <literal>SSL</literal> object as the underlying
|
||||
transport, using <function>BIO_set_ssl</function>.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-OpenSSL-Connection-Use">
|
||||
<title>Using an OpenSSL connection to send and receive data</title>
|
||||
<xi:include href="snippets/Features-TLS-Client-OpenSSL-Connection-Use.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
When it is time to close the connection, the
|
||||
<function>SSL_shutdown</function> function needs to be called
|
||||
twice for an orderly, synchronous connection termination
|
||||
(<xref
|
||||
linkend="ex-Defensive_Coding-TLS-OpenSSL-Connection-Close"/>).
|
||||
This exchanges <literal>close_notify</literal> alerts with the
|
||||
server. The additional logic is required to deal with an
|
||||
unexpected <literal>close_notify</literal> from the server.
|
||||
Note that is necessary to explicitly close the underlying
|
||||
socket after the connection object has been freed.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-OpenSSL-Connection-Close">
|
||||
<title>Closing an OpenSSL connection in an orderly fashion</title>
|
||||
<xi:include href="snippets/Features-TLS-OpenSSL-Connection-Close.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
<xref linkend="ex-Defensive_Coding-TLS-OpenSSL-Context-Close"/> shows how
|
||||
to deallocate the context object when it is no longer needed
|
||||
because no further TLS connections will be established.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-OpenSSL-Context-Close">
|
||||
<title>Closing an OpenSSL connection in an orderly fashion</title>
|
||||
<xi:include href="snippets/Features-TLS-OpenSSL-Context-Close.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-TLS-Client-GNUTLS">
|
||||
<title>Implementation TLS Clients With GNUTLS</title>
|
||||
<para>
|
||||
This section describes how to implement a TLS client with full
|
||||
certificate validation (but without certificate revocation
|
||||
checking). Note that the error handling in is only
|
||||
exploratory and needs to be replaced before production use.
|
||||
</para>
|
||||
<para>
|
||||
Before setting up TLS connections, a credentials objects has
|
||||
to be allocated and initialized with the set of trusted root
|
||||
CAs (<xref
|
||||
linkend="ex-Defensive_Coding-TLS-Client-GNUTLS-Credentials"/>).
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-Client-GNUTLS-Credentials">
|
||||
<title>Initializing a GNUTLS credentials structure</title>
|
||||
<xi:include href="snippets/Features-TLS-Client-GNUTLS-Credentials.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
After the last TLS connection has been closed, this credentials
|
||||
object should be freed:
|
||||
</para>
|
||||
<informalexample>
|
||||
<xi:include href="snippets/Features-TLS-GNUTLS-Credentials-Close.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</informalexample>
|
||||
<para>
|
||||
During its lifetime, the credentials object can be used to
|
||||
initialize TLS session objects from multiple threads, provided
|
||||
that it is not changed.
|
||||
</para>
|
||||
<para>
|
||||
Once the TCP connection has been established, the Nagle
|
||||
algorithm should be disabled (see <xref
|
||||
linkend="ex-Defensive_Coding-TLS-Nagle"/>). After that, the
|
||||
socket can be associated with a new GNUTLS session object.
|
||||
The previously allocated credentials object provides the set
|
||||
of root CAs. Then the TLS handshake must be initiated.
|
||||
This is shown in <xref
|
||||
linkend="ex-Defensive_Coding-TLS-Client-GNUTLS-Connect"/>.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-Client-GNUTLS-Connect">
|
||||
<title>Establishing a TLS client connection using GNUTLS</title>
|
||||
<xi:include href="snippets/Features-TLS-Client-GNUTLS-Connect.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
After the handshake has been completed, the server certificate
|
||||
needs to be verified against the server's hostname (<xref
|
||||
linkend="ex-Defensive_Coding-TLS-Client-GNUTLS-Verify"/>). In
|
||||
the example, the user-defined
|
||||
<function>certificate_validity_override</function> function is
|
||||
called if the verification fails, so that a separate,
|
||||
user-specific trust store can be checked. This function call
|
||||
can be omitted if the functionality is not needed.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-Client-GNUTLS-Verify">
|
||||
<title>Verifying a server certificate using GNUTLS</title>
|
||||
<xi:include href="snippets/Features-TLS-Client-GNUTLS-Verify.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
An established TLS session can be used for sending and
|
||||
receiving data, as in <xref
|
||||
linkend="ex-Defensive_Coding-TLS-GNUTLS-Use"/>.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-GNUTLS-Use">
|
||||
<title>Using a GNUTLS session</title>
|
||||
<xi:include href="snippets/Features-TLS-GNUTLS-Use.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
In order to shut down a connection in an orderly manner, you
|
||||
should call the <function>gnutls_bye</function> function.
|
||||
Finally, the session object can be deallocated using
|
||||
<function>gnutls_deinit</function> (see <xref
|
||||
linkend="ex-Defensive_Coding-TLS-GNUTLS-Disconnect"/>).
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-GNUTLS-Disconnect">
|
||||
<title>Closing a GNUTLS session in an orderly fashion</title>
|
||||
<xi:include href="snippets/Features-TLS-GNUTLS-Disconnect.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-TLS-Client-OpenJDK">
|
||||
<title>Implementing TLS Clients With OpenJDK</title>
|
||||
<para>
|
||||
The examples below use the following cryptographic-related
|
||||
classes:
|
||||
</para>
|
||||
<informalexample>
|
||||
<xi:include href="snippets/Features-TLS-Client-OpenJDK-Import.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</informalexample>
|
||||
<para>
|
||||
If compatibility with OpenJDK 6 is required, it is necessary
|
||||
to use the internal class
|
||||
<literal>sun.security.util.HostnameChecker</literal>. (The
|
||||
public OpenJDK API does not provide any support for dissecting
|
||||
the subject distinguished name of an X.509 certificate, so a
|
||||
custom-written DER parser is needed—or we have to use an
|
||||
internal class, which we do below.) In OpenJDK 7, the
|
||||
<function>setEndpointIdentificationAlgorithm</function> method
|
||||
was added to the
|
||||
<literal>javax.net.ssl.SSLParameters</literal> class,
|
||||
providing an official way to implement host name checking.
|
||||
</para>
|
||||
<para>
|
||||
TLS connections are established using an
|
||||
<literal>SSLContext</literal> instance. With a properly
|
||||
configured OpenJDK installation, the
|
||||
<literal>SunJSSE</literal> provider uses the system-wide set
|
||||
of trusted root certificate authorities, so no further
|
||||
configuration is necessary. For backwards compatibility with
|
||||
OpenJDK 6, the <literal>TLSv1</literal> provider has to
|
||||
be supported as a fall-back option. This is shown in <xref
|
||||
linkend="ex-Defensive_Coding-TLS-Client-OpenJDK-Context"/>.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-Client-OpenJDK-Context">
|
||||
<title>Setting up an <literal>SSLContext</literal> for OpenJDK TLS
|
||||
clients</title>
|
||||
<xi:include href="snippets/Features-TLS-Client-OpenJDK-Context.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
In addition to the context, a TLS parameter object will be
|
||||
needed which adjusts the cipher suites and protocols (<xref
|
||||
linkend="ex-Defensive_Coding-TLS-OpenJDK-Parameters"/>). Like
|
||||
the context, these parameters can be reused for multiple TLS
|
||||
connections.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-OpenJDK-Parameters">
|
||||
<title>Setting up <literal>SSLParameters</literal> for TLS use
|
||||
with OpenJDK</title>
|
||||
<xi:include href="snippets/Features-TLS-OpenJDK-Parameters.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
As initialized above, the parameter object does not yet
|
||||
require host name checking. This has to be enabled
|
||||
separately, and this is only supported by OpenJDK 7 and later:
|
||||
</para>
|
||||
<informalexample>
|
||||
<xi:include href="snippets/Features-TLS-Client-OpenJDK-Hostname.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</informalexample>
|
||||
<para>
|
||||
All application protocols can use the
|
||||
<literal>"HTTPS"</literal> algorithm. (The algorithms have
|
||||
minor differences with regard to wildcard handling, which
|
||||
should not matter in practice.)
|
||||
</para>
|
||||
<para>
|
||||
<xref linkend="ex-Defensive_Coding-TLS-Client-OpenJDK-Connect"/>
|
||||
shows how to establish the connection. Before the handshake
|
||||
is initialized, the protocol and cipher configuration has to
|
||||
be performed, by applying the parameter object
|
||||
<literal>params</literal>. (After this point, changes to
|
||||
<literal>params</literal> will not affect this TLS socket.)
|
||||
As mentioned initially, host name checking requires using an
|
||||
internal API on OpenJDK 6.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-Client-OpenJDK-Connect">
|
||||
<title>Establishing a TLS connection with OpenJDK</title>
|
||||
<xi:include href="snippets/Features-TLS-Client-OpenJDK-Connect.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
Starting with OpenJDK 7, the last lines can be omitted,
|
||||
provided that host name verification has been enabled by
|
||||
calling the
|
||||
<function>setEndpointIdentificationAlgorithm</function> method
|
||||
on the <literal>params</literal> object (before it was applied
|
||||
to the socket).
|
||||
</para>
|
||||
<para>
|
||||
The TLS socket can be used as a regular socket, as shown in
|
||||
<xref linkend="ex-Defensive_Coding-TLS-Client-OpenJDK-Use"/>.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-Client-OpenJDK-Use">
|
||||
<title>Using a TLS client socket in OpenJDK</title>
|
||||
<xi:include href="snippets/Features-TLS-Client-OpenJDK-Use.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<section>
|
||||
<title>Overriding server certificate validation with OpenJDK 6</title>
|
||||
<para>
|
||||
Overriding certificate validation requires a custom trust
|
||||
manager. With OpenJDK 6, the trust manager lacks
|
||||
information about the TLS session, and to which server the
|
||||
connection is made. Certificate overrides have to be tied
|
||||
to specific servers (host names). Consequently, different
|
||||
<literal>TrustManager</literal> and
|
||||
<literal>SSLContext</literal> objects have to be used for
|
||||
different servers.
|
||||
</para>
|
||||
<para>
|
||||
In the trust manager shown in <xref
|
||||
linkend="ex-Defensive_Coding-TLS-Client-MyTrustManager"/>,
|
||||
the server certificate is identified by its SHA-256 hash.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-Client-MyTrustManager">
|
||||
<title>A customer trust manager for OpenJDK TLS clients</title>
|
||||
<xi:include href="snippets/Features-TLS-Client-OpenJDK-MyTrustManager.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
This trust manager has to be passed to the
|
||||
<literal>init</literal> method of the
|
||||
<literal>SSLContext</literal> object, as show in <xref
|
||||
linkend="ex-Defensive_Coding-TLS-Client-Context_For_Cert"/>.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-Client-Context_For_Cert">
|
||||
<title>Using a custom TLS trust manager with OpenJDK</title>
|
||||
<xi:include href="snippets/Features-TLS-Client-OpenJDK-Context_For_Cert.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
When certificate overrides are in place, host name
|
||||
verification should not be performed because there is no
|
||||
security requirement that the host name in the certificate
|
||||
matches the host name used to establish the connection (and
|
||||
it often will not). However, without host name
|
||||
verification, it is not possible to perform transparent
|
||||
fallback to certification validation using the system
|
||||
certificate store.
|
||||
</para>
|
||||
<para>
|
||||
The approach described above works with OpenJDK 6 and later
|
||||
versions. Starting with OpenJDK 7, it is possible to use a
|
||||
custom subclass of the
|
||||
<literal>javax.net.ssl.X509ExtendedTrustManager</literal>
|
||||
class. The OpenJDK TLS implementation will call the new
|
||||
methods, passing along TLS session information. This can be
|
||||
used to implement certificate overrides as a fallback (if
|
||||
certificate or host name verification fails), and a trust
|
||||
manager object can be used for multiple servers because the
|
||||
server address is available to the trust manager.
|
||||
</para>
|
||||
</section>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-TLS-Client-NSS">
|
||||
<title>Implementing TLS Clients With NSS</title>
|
||||
<para>
|
||||
The following code shows how to implement a simple TLS client
|
||||
using NSS. These instructions apply to NSS version 3.14 and
|
||||
later. Versions before 3.14 need different initialization
|
||||
code.
|
||||
</para>
|
||||
<para>
|
||||
Keep in mind that the error handling needs to be improved
|
||||
before the code can be used in production.
|
||||
</para>
|
||||
<para>
|
||||
Using NSS needs several header files, as shown in
|
||||
<xref linkend="ex-Defensive_Coding-TLS-NSS-Includes"/>.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-NSS-Includes">
|
||||
<title>Include files for NSS</title>
|
||||
<xi:include href="snippets/Features-TLS-NSS-Includes.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
Initializing the NSS library is shown in <xref
|
||||
linkend="ex-Defensive_Coding-TLS-NSS-Init"/>. This
|
||||
initialization procedure overrides global state. We only call
|
||||
<function>NSS_SetDomesticPolicy</function> if there are no
|
||||
strong ciphers available, assuming that it has already been
|
||||
called otherwise. This avoids overriding the process-wide
|
||||
cipher suite policy unnecessarily.
|
||||
</para>
|
||||
<para>
|
||||
The simplest way to configured the trusted root certificates
|
||||
involves loading the <filename>libnssckbi.so</filename> NSS
|
||||
module with a call to the
|
||||
<function>SECMOD_LoadUserModule</function> function. The root
|
||||
certificates are compiled into this module. (The PEM module
|
||||
for NSS, <filename>libnsspem.so</filename>, offers a way to
|
||||
load trusted CA certificates from a file.)
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-NSS-Init">
|
||||
<title>Initializing the NSS library</title>
|
||||
<xi:include href="snippets/Features-TLS-NSS-Init.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
Some of the effects of the initialization can be reverted with
|
||||
the following function calls:
|
||||
</para>
|
||||
<informalexample id="ex-Defensive_Coding-TLS-NSS-Close">
|
||||
<xi:include href="snippets/Features-TLS-NSS-Close.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</informalexample>
|
||||
<para>
|
||||
After NSS has been initialized, the TLS connection can be
|
||||
created (<xref
|
||||
linkend="ex-Defensive_Coding-TLS-Client-NSS-Connect"/>). The
|
||||
internal <function>PR_ImportTCPSocket</function> function is
|
||||
used to turn the POSIX file descriptor
|
||||
<literal>sockfd</literal> into an NSPR file descriptor. (This
|
||||
function is de-facto part of the NSS public ABI, so it will
|
||||
not go away.) Creating the TLS-capable file descriptor
|
||||
requires a <emphasis>model</emphasis> descriptor, which is
|
||||
configured with the desired set of protocols. The model
|
||||
descriptor is not needed anymore after TLS support has been
|
||||
activated for the existing connection descriptor.
|
||||
</para>
|
||||
<para>
|
||||
The call to <function>SSL_BadCertHook</function> can be
|
||||
omitted if no mechanism to override certificate verification
|
||||
is needed. The <literal>bad_certificate</literal> function
|
||||
must check both the host name specified for the connection and
|
||||
the certificate before granting the override.
|
||||
</para>
|
||||
<para>
|
||||
Triggering the actual handshake requires three function calls,
|
||||
<function>SSL_ResetHandshake</function>,
|
||||
<function>SSL_SetURL</function>, and
|
||||
<function>SSL_ForceHandshake</function>. (If
|
||||
<function>SSL_ResetHandshake</function> is omitted,
|
||||
<function>SSL_ForceHandshake</function> will succeed, but the
|
||||
data will not be encrypted.) During the handshake, the
|
||||
certificate is verified and matched against the host name.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-Client-NSS-Connect">
|
||||
<title>Creating a TLS connection with NSS</title>
|
||||
<xi:include href="snippets/Features-TLS-Client-NSS-Connect.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
After the connection has been established, <xref
|
||||
linkend="ex-Defensive_Coding-TLS-NSS-Use"/> shows how to use
|
||||
the NSPR descriptor to communicate with the server.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-NSS-Use">
|
||||
<title>Using NSS for sending and receiving data</title>
|
||||
<xi:include href="snippets/Features-TLS-NSS-Use.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
<xref linkend="ex-Defensive_Coding-TLS-Client-NSS-Close"/>
|
||||
shows how to close the connection.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-Client-NSS-Close">
|
||||
<title>Closing NSS client connections</title>
|
||||
<xi:include href="snippets/Features-TLS-Client-NSS-Close.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-TLS-Client-Python">
|
||||
<title>Implementing TLS Clients With Python</title>
|
||||
<para>
|
||||
The Python distribution provides a TLS implementation in the
|
||||
<literal>ssl</literal> module (actually a wrapper around
|
||||
OpenSSL). The exported interface is somewhat restricted, so
|
||||
that the client code shown below does not fully implement the
|
||||
recommendations in <xref
|
||||
linkend="sect-Defensive_Coding-TLS-OpenSSL"/>.
|
||||
</para>
|
||||
<important>
|
||||
<para>
|
||||
Currently, most Python function which accept
|
||||
<literal>https://</literal> URLs or otherwise implement
|
||||
HTTPS support do not perform certificate validation at all.
|
||||
(For example, this is true for the <literal>httplib</literal>
|
||||
and <literal>xmlrpclib</literal> modules.) If you use
|
||||
HTTPS, you should not use the built-in HTTP clients. The
|
||||
<literal>Curl</literal> class in the <literal>curl</literal>
|
||||
module, as provided by the <literal>python-pycurl</literal>
|
||||
package implements proper certificate validation.
|
||||
</para>
|
||||
</important>
|
||||
<para>
|
||||
The <literal>ssl</literal> module currently does not perform
|
||||
host name checking on the server certificate. <xref
|
||||
linkend="ex-Defensive_Coding-TLS-Client-Python-check_host_name"/>
|
||||
shows how to implement certificate matching, using the parsed
|
||||
certificate returned by <function>getpeercert</function>.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-Client-Python-check_host_name">
|
||||
<title>Implementing TLS host name checking Python (without
|
||||
wildcard support)</title>
|
||||
<xi:include href="snippets/Features-TLS-Client-Python-check_host_name.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
To turn a regular, connected TCP socket into a TLS-enabled
|
||||
socket, use the <function>ssl.wrap_socket</function> function.
|
||||
The function call in <xref
|
||||
linkend="ex-Defensive_Coding-TLS-Client-Python-Connect"/>
|
||||
provides additional arguments to override questionable
|
||||
defaults in OpenSSL and in the Python module.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
<literal>ciphers="HIGH:-aNULL:-eNULL:-PSK:RC4-SHA:RC4-MD5"</literal>
|
||||
selects relatively strong cipher suites with
|
||||
certificate-based authentication. (The call to
|
||||
<function>check_host_name</function> function provides
|
||||
additional protection against anonymous cipher suites.)
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<literal>ssl_version=ssl.PROTOCOL_TLSv1</literal> disables
|
||||
SSL 2.0 support. By default, the <literal>ssl</literal>
|
||||
module sends an SSL 2.0 client hello, which is rejected by
|
||||
some servers. Ideally, we would request OpenSSL to
|
||||
negotiated the most recent TLS version supported by the
|
||||
server and the client, but the Python module does not
|
||||
allow this.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<literal>cert_reqs=ssl.CERT_REQUIRED</literal> turns on
|
||||
certificate validation.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<literal>ca_certs='/etc/ssl/certs/ca-bundle.crt'</literal>
|
||||
initializes the certificate store with a set of trusted
|
||||
root CAs. Unfortunately, it is necessary to hard-code
|
||||
this path into applications because the default path in
|
||||
OpenSSL is not available through the Python
|
||||
<literal>ssl</literal> module.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
The <literal>ssl</literal> module (and OpenSSL) perform
|
||||
certificate validation, but the certificate must be compared
|
||||
manually against the host name, by calling the
|
||||
<function>check_host_name</function> defined above.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-TLS-Client-Python-Connect">
|
||||
<title>Establishing a TLS client connection with Python</title>
|
||||
<xi:include href="snippets/Features-TLS-Client-Python-Connect.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
After the connection has been established, the TLS socket can
|
||||
be used like a regular socket:
|
||||
</para>
|
||||
<informalexample>
|
||||
<xi:include href="snippets/Features-TLS-Python-Use.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</informalexample>
|
||||
<para>
|
||||
Closing the TLS socket is straightforward as well:
|
||||
</para>
|
||||
<informalexample>
|
||||
<xi:include href="snippets/Features-TLS-Python-Close.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</informalexample>
|
||||
</section>
|
||||
</section>
|
||||
</chapter>
|
110
en-US/Go.xml
110
en-US/Go.xml
|
@ -1,110 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE chapter PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<chapter id="chap-Defensive_Coding-Go">
|
||||
<title>The Go Programming Language</title>
|
||||
<para>
|
||||
This chapter contains language-specific recommendations for Go.
|
||||
</para>
|
||||
<section id="chap-Defensive_Coding-Go-Memory_Safety">
|
||||
<title>Memory Safety</title>
|
||||
<para>
|
||||
Go provides memory safety, but only if the program is not executed
|
||||
in parallel (that is, <envar>GOMAXPROCS</envar> is not larger than
|
||||
<literal>1</literal>). The reason is that interface values and
|
||||
slices consist of multiple words are not updated atomically.
|
||||
Another thread of execution can observe an inconsistent pairing
|
||||
between type information and stored value (for interfaces) or
|
||||
pointer and length (for slices), and such inconsistency can lead
|
||||
to a memory safety violation.
|
||||
</para>
|
||||
<para>
|
||||
Code which does not run in parallel and does not use the
|
||||
<literal>unsafe</literal> package (or other packages which expose
|
||||
unsafe constructs) is memory-safe. For example, invalid casts and
|
||||
out-of-range subscripting cause panics at run time.
|
||||
</para>
|
||||
<para>
|
||||
Keep in mind that finalization can introduce parallelism because
|
||||
finalizers are executed concurrently, potentially interleaved with
|
||||
the rest of the program.
|
||||
</para>
|
||||
</section>
|
||||
<section id="chap-Defensive_Coding-Go-Error_Handling">
|
||||
<title>Error Handling</title>
|
||||
<para>
|
||||
Only a few common operations (such as pointer dereference, integer
|
||||
division, array subscripting) trigger exceptions in Go, called
|
||||
<emphasis>panics</emphasis>. Most interfaces in the standard
|
||||
library use a separate return value of type
|
||||
<literal>error</literal> to signal error.
|
||||
</para>
|
||||
<para>
|
||||
Not checking error return values can lead to incorrect operation
|
||||
and data loss (especially in the case of writes, using interfaces
|
||||
such as <literal>io.Writer</literal>).
|
||||
</para>
|
||||
<para>
|
||||
The correct way to check error return values depends on the
|
||||
function or method being called. In the majority of cases, the
|
||||
first step after calling a function should be an error check
|
||||
against the <literal>nil</literal> value, handling any encountered
|
||||
error. See <xref
|
||||
linkend="ex-Defensive_Coding-Go-Error_Handling-Regular"/> for
|
||||
details.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Go-Error_Handling-Regular">
|
||||
<title>Regular error handling in Go</title>
|
||||
<xi:include href="snippets/Go-Error_Handling-Regular.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
However, with <literal>io.Reader</literal>,
|
||||
<literal>io.ReaderAt</literal> and related interfaces, it is
|
||||
necessary to check for a non-zero number of read bytes first, as
|
||||
shown in <xref
|
||||
linkend="ex-Defensive_Coding-Go-Error_Handling-IO"/>. If this
|
||||
pattern is not followed, data loss may occur. This is due to the
|
||||
fact that the <literal>io.Reader</literal> interface permits
|
||||
returning both data and an error at the same time.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Go-Error_Handling-IO">
|
||||
<title>Read error handling in Go</title>
|
||||
<xi:include href="snippets/Go-Error_Handling-IO.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
</section>
|
||||
<section id="chap-Defensive_Coding-Go-Garbage_Collector">
|
||||
<title>Garbage Collector</title>
|
||||
<para>
|
||||
Older Go releases (before Go 1.3) use a conservative garbage
|
||||
collector without blacklisting. This means that data blobs can
|
||||
cause retention of unrelated data structures because the data is
|
||||
conservatively interpreted as pointers. This phenomenon can be
|
||||
triggered accidentally on 32-bit architectures and is more likely
|
||||
to occur if the heap grows larger. On 64-bit architectures, it
|
||||
may be possible to trigger it deliberately—it is unlikely to occur
|
||||
spontaneously.
|
||||
</para>
|
||||
</section>
|
||||
<section id="chap-Defensive_Coding-Go-Marshaling">
|
||||
<title>Marshaling and Unmarshaling</title>
|
||||
<para>
|
||||
Several packages in the <literal>encoding</literal> hierarchy
|
||||
provide support for serialization and deserialization. The usual
|
||||
caveats apply (see
|
||||
<xref linkend="chap-Defensive_Coding-Tasks-Serialization"/>).
|
||||
</para>
|
||||
<para>
|
||||
As an additional precaution, the <function>Unmarshal</function>
|
||||
and <function>Decode</function> functions should only be used with
|
||||
fresh values in the <literal>interface{}</literal> argument. This
|
||||
is due to the way defaults for missing values are implemented:
|
||||
During deserialization, missing value do not result in an error,
|
||||
but the original value is preserved. Using a fresh value (with
|
||||
suitable default values if necessary) ensures that data from a
|
||||
previous deserialization operation does not leak into the current
|
||||
one. This is especially relevant when structs are deserialized.
|
||||
</para>
|
||||
</section>
|
||||
</chapter>
|
|
@ -1,291 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE section PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<section id="sect-Defensive_Coding-Java-Language">
|
||||
<title>The Core Language</title>
|
||||
<para>
|
||||
Implementations of the Java programming language provide strong
|
||||
memory safety, even in the presence of data races in concurrent
|
||||
code. This prevents a large range of security vulnerabilities
|
||||
from occurring, unless certain low-level features are used; see
|
||||
<xref linkend="sect-Defensive_Coding-Java-LowLevel"/>.
|
||||
</para>
|
||||
|
||||
<section id="sect-Defensive_Coding-Java-Language-ReadArray">
|
||||
<title>Increasing Robustness when Reading Arrays</title>
|
||||
<para>
|
||||
External data formats often include arrays, and the data is
|
||||
stored as an integer indicating the number of array elements,
|
||||
followed by this number of elements in the file or protocol data
|
||||
unit. This length specified can be much larger than what is
|
||||
actually available in the data source.
|
||||
</para>
|
||||
<para>
|
||||
To avoid allocating extremely large amounts of data, you can
|
||||
allocate a small array initially and grow it as you read more
|
||||
data, implementing an exponential growth policy. See the
|
||||
<function>readBytes(InputStream, int)</function> function in
|
||||
<xref linkend="ex-Defensive_Coding-Java-Language-ReadArray"/>.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Java-Language-ReadArray">
|
||||
<title>Incrementally reading a byte array</title>
|
||||
<xi:include href="snippets/Java-Language-ReadArray.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
When reading data into arrays, hash maps or hash sets, use the
|
||||
default constructor and do not specify a size hint. You can
|
||||
simply add the elements to the collection as you read them.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Java-Language-Resources">
|
||||
<title>Resource Management</title>
|
||||
<para>
|
||||
Unlike C++, Java does not offer destructors which can deallocate
|
||||
resources in a predictable fashion. All resource management has
|
||||
to be manual, at the usage site. (Finalizers are generally not
|
||||
usable for resource management, especially in high-performance
|
||||
code; see <xref
|
||||
linkend="sect-Defensive_Coding-Java-Language-Finalizers"/>.)
|
||||
</para>
|
||||
<para>
|
||||
The first option is the
|
||||
<literal>try</literal>-<literal>finally</literal> construct, as
|
||||
shown in <xref linkend="ex-Defensive_Coding-Java-Language-Finally"/>.
|
||||
The code in the <literal>finally</literal> block should be as short as
|
||||
possible and should not throw any exceptions.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Java-Language-Finally">
|
||||
<title>Resource management with a
|
||||
<literal>try</literal>-<literal>finally</literal> block</title>
|
||||
<xi:include href="snippets/Java-Finally.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
Note that the resource allocation happens
|
||||
<emphasis>outside</emphasis> the <literal>try</literal> block,
|
||||
and that there is no <literal>null</literal> check in the
|
||||
<literal>finally</literal> block. (Both are common artifacts
|
||||
stemming from IDE code templates.)
|
||||
</para>
|
||||
<para>
|
||||
If the resource object is created freshly and implements the
|
||||
<literal>java.lang.AutoCloseable</literal> interface, the code
|
||||
in <xref
|
||||
linkend="ex-Defensive_Coding-Java-Language-TryWithResource"/> can be
|
||||
used instead. The Java compiler will automatically insert the
|
||||
<function>close()</function> method call in a synthetic
|
||||
<literal>finally</literal> block.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Java-Language-TryWithResource">
|
||||
<title>Resource management using the
|
||||
<literal>try</literal>-with-resource construct</title>
|
||||
<xi:include href="snippets/Java-TryWithResource.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
To be compatible with the <literal>try</literal>-with-resource
|
||||
construct, new classes should name the resource deallocation
|
||||
method <function>close()</function>, and implement the
|
||||
<literal>AutoCloseable</literal> interface (the latter breaking
|
||||
backwards compatibility with Java 6). However, using the
|
||||
<literal>try</literal>-with-resource construct with objects that
|
||||
are not freshly allocated is at best awkward, and an explicit
|
||||
<literal>finally</literal> block is usually the better approach.
|
||||
</para>
|
||||
<para>
|
||||
In general, it is best to design the programming interface in
|
||||
such a way that resource deallocation methods like
|
||||
<function>close()</function> cannot throw any (checked or
|
||||
unchecked) exceptions, but this should not be a reason to ignore
|
||||
any actual error conditions.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Java-Language-Finalizers">
|
||||
<title>Finalizers</title>
|
||||
<para>
|
||||
Finalizers can be used a last-resort approach to free resources
|
||||
which would otherwise leak. Finalization is unpredictable,
|
||||
costly, and there can be a considerable delay between the last
|
||||
reference to an object going away and the execution of the
|
||||
finalizer. Generally, manual resource management is required;
|
||||
see <xref linkend="sect-Defensive_Coding-Java-Language-Resources"/>.
|
||||
</para>
|
||||
<para>
|
||||
Finalizers should be very short and should only deallocate
|
||||
native or other external resources held directly by the object
|
||||
being finalized. In general, they must use synchronization:
|
||||
Finalization necessarily happens on a separate thread because it is
|
||||
inherently concurrent. There can be multiple finalization
|
||||
threads, and despite each object being finalized at most once,
|
||||
the finalizer must not assume that it has exclusive access to
|
||||
the object being finalized (in the <literal>this</literal>
|
||||
pointer).
|
||||
</para>
|
||||
<para>
|
||||
Finalizers should not deallocate resources held by other
|
||||
objects, especially if those objects have finalizers on their
|
||||
own. In particular, it is a very bad idea to define a finalizer
|
||||
just to invoke the resource deallocation method of another object,
|
||||
or overwrite some pointer fields.
|
||||
</para>
|
||||
<para>
|
||||
Finalizers are not guaranteed to run at all. For instance, the
|
||||
virtual machine (or the machine underneath) might crash,
|
||||
preventing their execution.
|
||||
</para>
|
||||
<para>
|
||||
Objects with finalizers are garbage-collected much later than
|
||||
objects without them, so using finalizers to zero out key
|
||||
material (to reduce its undecrypted lifetime in memory) may have
|
||||
the opposite effect, keeping objects around for much longer and
|
||||
prevent them from being overwritten in the normal course of
|
||||
program execution.
|
||||
</para>
|
||||
<para>
|
||||
For the same reason, code which allocates objects with
|
||||
finalizers at a high rate will eventually fail (likely with a
|
||||
<literal>java.lang.OutOfMemoryError</literal> exception) because
|
||||
the virtual machine has finite resources for keeping track of
|
||||
objects pending finalization. To deal with that, it may be
|
||||
necessary to recycle objects with finalizers.
|
||||
</para>
|
||||
<para>
|
||||
The remarks in this section apply to finalizers which are
|
||||
implemented by overriding the <function>finalize()</function>
|
||||
method, and to custom finalization using reference queues.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Java-Language-Exceptions">
|
||||
<title>Recovering from Exceptions and Errors</title>
|
||||
<para>
|
||||
Java exceptions come in three kinds, all ultimately deriving
|
||||
from <literal>java.lang.Throwable</literal>:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
<emphasis>Run-time exceptions</emphasis> do not have to be
|
||||
declared explicitly and can be explicitly thrown from any
|
||||
code, by calling code which throws them, or by triggering an
|
||||
error condition at run time, like division by zero, or an
|
||||
attempt at an out-of-bounds array access. These exceptions
|
||||
derive from from the
|
||||
<literal>java.lang.RuntimeException</literal> class (perhaps
|
||||
indirectly).
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<emphasis>Checked exceptions</emphasis> have to be declared
|
||||
explicitly by functions that throw or propagate them. They
|
||||
are similar to run-time exceptions in other regards, except
|
||||
that there is no language construct to throw them (except
|
||||
the <literal>throw</literal> statement itself). Checked
|
||||
exceptions are only present at the Java language level and
|
||||
are only enforced at compile time. At run time, the virtual
|
||||
machine does not know about them and permits throwing
|
||||
exceptions from any code. Checked exceptions must derive
|
||||
(perhaps indirectly) from the
|
||||
<literal>java.lang.Exception</literal> class, but not from
|
||||
<literal>java.lang.RuntimeException</literal>.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<emphasis>Errors</emphasis> are exceptions which typically
|
||||
reflect serious error conditions. They can be thrown at any
|
||||
point in the program, and do not have to be declared (unlike
|
||||
checked exceptions). In general, it is not possible to
|
||||
recover from such errors; more on that below, in <xref
|
||||
linkend="sect-Defensive_Coding-Java-Language-Exceptions-Errors"/>.
|
||||
Error classes derive (perhaps indirectly) from
|
||||
<literal>java.lang.Error</literal>, or from
|
||||
<literal>java.lang.Throwable</literal>, but not from
|
||||
<literal>java.lang.Exception</literal>.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
|
||||
<para>
|
||||
The general expection is that run-time errors are avoided by
|
||||
careful programming (e.g., not dividing by zero). Checked
|
||||
exception are expected to be caught as they happen (e.g., when
|
||||
an input file is unexpectedly missing). Errors are impossible
|
||||
to predict and can happen at any point and reflect that
|
||||
something went wrong beyond all expectations.
|
||||
</para>
|
||||
|
||||
<section id="sect-Defensive_Coding-Java-Language-Exceptions-Errors">
|
||||
<title>The Difficulty of Catching Errors</title>
|
||||
<para>
|
||||
Errors (that is, exceptions which do not (indirectly) derive
|
||||
from <literal>java.lang.Exception</literal>), have the
|
||||
peculiar property that catching them is problematic. There
|
||||
are several reasons for this:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
The error reflects a failed consistenty check, for example,
|
||||
<literal>java.lang.AssertionError</literal>.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The error can happen at any point, resulting in
|
||||
inconsistencies due to half-updated objects. Examples are
|
||||
<literal>java.lang.ThreadDeath</literal>,
|
||||
<literal>java.lang.OutOfMemoryError</literal> and
|
||||
<literal>java.lang.StackOverflowError</literal>.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The error indicates that virtual machine failed to provide
|
||||
some semantic guarantees by the Java programming language.
|
||||
<literal>java.lang.ExceptionInInitializerError</literal>
|
||||
is an example—it can leave behind a half-initialized
|
||||
class.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
In general, if an error is thrown, the virtual machine should
|
||||
be restarted as soon as possible because it is in an
|
||||
inconsistent state. Continuing running as before can have
|
||||
unexpected consequences. However, there are legitimate
|
||||
reasons for catching errors because not doing so leads to even
|
||||
greater problems.
|
||||
</para>
|
||||
<para>
|
||||
Code should be written in a way that avoids triggering errors.
|
||||
See <xref linkend="sect-Defensive_Coding-Java-Language-ReadArray"/>
|
||||
for an example.
|
||||
</para>
|
||||
<para>
|
||||
It is usually necessary to log errors. Otherwise, no trace of
|
||||
the problem might be left anywhere, making it very difficult
|
||||
to diagnose realted failures. Consequently, if you catch
|
||||
<literal>java.lang.Exception</literal> to log and suppress all
|
||||
unexpected exceptions (for example, in a request dispatching
|
||||
loop), you should consider switching to
|
||||
<literal>java.lang.Throwable</literal> instead, to also cover
|
||||
errors.
|
||||
</para>
|
||||
<para>
|
||||
The other reason mainly applies to such request dispatching
|
||||
loops: If you do not catch errors, the loop stops looping,
|
||||
resulting in a denial of service.
|
||||
</para>
|
||||
<para>
|
||||
However, if possible, catching errors should be coupled with a
|
||||
way to signal the requirement of a virtual machine restart.
|
||||
</para>
|
||||
</section>
|
||||
</section>
|
||||
</section>
|
||||
|
|
@ -1,157 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE section PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<section id="sect-Defensive_Coding-Java-LowLevel">
|
||||
<title>Low-level Features of the Virtual Machine</title>
|
||||
|
||||
<section id="sect-Defensive_Coding-Java-Reflection">
|
||||
<title><literal>Reflection and Private Parts</literal></title>
|
||||
<para>
|
||||
The <function>setAccessible(boolean)</function> method of the
|
||||
<literal>java.lang.reflect.AccessibleObject</literal> class
|
||||
allows a program to disable language-defined access rules for
|
||||
specific constructors, methods, or fields. Once the access
|
||||
checks are disabled, any code can use the
|
||||
<literal>java.lang.reflect.Constructor</literal>,
|
||||
<literal>java.lang.reflect.Method</literal>, or
|
||||
<literal>java.lang.reflect.Field</literal> object to access the
|
||||
underlying Java entity, without further permission checks. This
|
||||
breaks encapsulation and can undermine the stability of the
|
||||
virtual machine. (In contrast, without using the
|
||||
<function>setAccessible(boolean)</function> method, this should
|
||||
not happen because all the language-defined checks still apply.)
|
||||
</para>
|
||||
<para>
|
||||
This feature should be avoided if possible.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Java-JNI">
|
||||
<title>Java Native Interface (JNI)</title>
|
||||
<para>
|
||||
The Java Native Interface allows calling from Java code
|
||||
functions specifically written for this purpose, usually in C or
|
||||
C++.
|
||||
</para>
|
||||
<para>
|
||||
The transition between the Java world and the C world is not
|
||||
fully type-checked, and the C code can easily break the Java
|
||||
virtual machine semantics. Therefore, extra care is needed when
|
||||
using this functionality.
|
||||
</para>
|
||||
<para>
|
||||
To provide a moderate amount of type safety, it is recommended
|
||||
to recreate the class-specific header file using
|
||||
<application>javah</application> during the build process,
|
||||
include it in the implementation, and use the
|
||||
<option>-Wmissing-declarations</option> option.
|
||||
</para>
|
||||
<para>
|
||||
Ideally, the required data is directly passed to static JNI
|
||||
methods and returned from them, and the code and the C side does
|
||||
not have to deal with accessing Java fields (or even methods).
|
||||
</para>
|
||||
<para>
|
||||
When using <function>GetPrimitiveArrayCritical</function> or
|
||||
<function>GetStringCritical</function>, make sure that you only
|
||||
perform very little processing between the get and release
|
||||
operations. Do not access the file system or the network, and
|
||||
not perform locking, because that might introduce blocking.
|
||||
When processing large strings or arrays, consider splitting the
|
||||
computation into multiple sub-chunks, so that you do not prevent
|
||||
the JVM from reaching a safepoint for extended periods of time.
|
||||
</para>
|
||||
<para>
|
||||
If necessary, you can use the Java <literal>long</literal> type
|
||||
to store a C pointer in a field of a Java class. On the C side,
|
||||
when casting between the <literal>jlong</literal> value and the
|
||||
pointer on the C side,
|
||||
</para>
|
||||
<para>
|
||||
You should not try to perform pointer arithmetic on the Java
|
||||
side (that is, you should treat pointer-carrying
|
||||
<literal>long</literal> values as opaque). When passing a slice
|
||||
of an array to the native code, follow the Java convention and
|
||||
pass it as the base array, the integer offset of the start of
|
||||
the slice, and the integer length of the slice. On the native
|
||||
side, check the offset/length combination against the actual
|
||||
array length, and use the offset to compute the pointer to the
|
||||
beginning of the array.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Java-JNI-Pointers">
|
||||
<title>Array length checking in JNI code</title>
|
||||
<xi:include href="snippets/Java-JNI-Pointers.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
In any case, classes referring to native resources must be
|
||||
declared <literal>final</literal>, and must not be serializeable
|
||||
or cloneable. Initialization and mutation of the state used by
|
||||
the native side must be controlled carefully. Otherwise, it
|
||||
might be possible to create an object with inconsistent native
|
||||
state which results in a crash (or worse) when used (or perhaps
|
||||
only finalized) later. If you need both Java inheritance and
|
||||
native resources, you should consider moving the native state to
|
||||
a separate class, and only keep a reference to objects of that
|
||||
class. This way, cloning and serialization issues can be
|
||||
avoided in most cases.
|
||||
</para>
|
||||
<para>
|
||||
If there are native resources associated with an object, the
|
||||
class should have an explicit resource deallocation method
|
||||
(<xref
|
||||
linkend="sect-Defensive_Coding-Java-Language-Resources"/>) and a
|
||||
finalizer (<xref
|
||||
linkend="sect-Defensive_Coding-Java-Language-Finalizers"/>) as a
|
||||
last resort. The need for finalization means that a minimum
|
||||
amount of synchronization is needed. Code on the native side
|
||||
should check that the object is not in a closed/freed state.
|
||||
</para>
|
||||
<para>
|
||||
Many JNI functions create local references. By default, these
|
||||
persist until the JNI-implemented method returns. If you create
|
||||
many such references (e.g., in a loop), you may have to free
|
||||
them using <function>DeleteLocalRef</function>, or start using
|
||||
<function>PushLocalFrame</function> and
|
||||
<function>PopLocalFrame</function>. Global references must be
|
||||
deallocated with <function>DeleteGlobalRef</function>, otherwise
|
||||
there will be a memory leak, just as with
|
||||
<function>malloc</function> and <function>free</function>.
|
||||
</para>
|
||||
<para>
|
||||
When throwing exceptions using <function>Throw</function> or
|
||||
<function>ThrowNew</function>, be aware that these functions
|
||||
return regularly. You have to return control manually to the
|
||||
JVM.
|
||||
</para>
|
||||
<para>
|
||||
Technically, the <literal>JNIEnv</literal> pointer is not
|
||||
necessarily constant during the lifetime of your JNI module.
|
||||
Storing it in a global variable is therefore incorrect.
|
||||
Particularly if you are dealing with callbacks, you may have to
|
||||
store the pointer in a thread-local variable (defined with
|
||||
<literal>__thread</literal>). It is, however, best to avoid the
|
||||
complexity of calling back into Java code.
|
||||
</para>
|
||||
<para>
|
||||
Keep in mind that C/C++ and Java are different languages,
|
||||
despite very similar syntax for expressions. The Java memory
|
||||
model is much more strict than the C or C++ memory models, and
|
||||
native code needs more synchronization, usually using JVM
|
||||
facilities or POSIX threads mutexes. Integer overflow in Java
|
||||
is defined, but in C/C++ it is not (for the
|
||||
<literal>jint</literal> and <literal>jlong</literal> types).
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Java-MiscUnsafe">
|
||||
<title><literal>sun.misc.Unsafe</literal></title>
|
||||
<para>
|
||||
The <literal>sun.misc.Unsafe</literal> class is unportable and
|
||||
contains many functions explicitly designed to break Java memory
|
||||
safety (for performance and debugging). If possible, avoid
|
||||
using this class.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
</section>
|
|
@ -1,292 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE section PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<section id="sect-Defensive_Coding-Java-SecurityManager">
|
||||
<title>Interacting with the Security Manager</title>
|
||||
<para>
|
||||
The Java platform is largely implemented in the Java language
|
||||
itself. Therefore, within the same JVM, code runs which is part
|
||||
of the Java installation and which is trusted, but there might
|
||||
also be code which comes from untrusted sources and is restricted
|
||||
by the Java sandbox (to varying degrees). The <emphasis>security
|
||||
manager</emphasis> draws a line between fully trusted, partially
|
||||
trusted and untrusted code.
|
||||
</para>
|
||||
<para>
|
||||
The type safety and accessibility checks provided by the Java
|
||||
language and JVM would be sufficient to implement a sandbox.
|
||||
However, only some Java APIs employ such a capabilities-based
|
||||
approach. (The Java SE library contains many public classes with
|
||||
public constructors which can break any security policy, such as
|
||||
<literal>java.io.FileOutputStream</literal>.) Instead, critical
|
||||
functionality is protected by <emphasis>stack
|
||||
inspection</emphasis>: At a security check, the stack is walked
|
||||
from top (most-nested) to bottom. The security check fails if a
|
||||
stack frame for a method is encountered whose class lacks the
|
||||
permission which the security check requires.
|
||||
</para>
|
||||
<para>
|
||||
This simple approach would not allow untrusted code (which lacks
|
||||
certain permissions) to call into trusted code while the latter
|
||||
retains trust. Such trust transitions are desirable because they
|
||||
enable Java as an implementation language for most parts of the
|
||||
Java platform, including security-relevant code. Therefore, there
|
||||
is a mechanism to mark certain stack frames as trusted (<xref
|
||||
linkend="sect-Defensive_Coding-Java-SecurityManager-Privileged"/>).
|
||||
</para>
|
||||
<para>
|
||||
In theory, it is possible to run a Java virtual machine with a
|
||||
security manager that acts very differently from this approach,
|
||||
but a lot of code expects behavior very close to the platform
|
||||
default (including many classes which are part of the OpenJDK
|
||||
implementation).
|
||||
</para>
|
||||
|
||||
<section id="sect-Defensive_Coding-Java-SecurityManager-Compatible">
|
||||
<title>Security Manager Compatibility</title>
|
||||
<para>
|
||||
A lot of code can run without any additional permissions at all,
|
||||
with little changes. The following guidelines should help to
|
||||
increase compatibility with a restrictive security manager.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
When retrieving system properties using
|
||||
<function>System.getProperty(String)</function> or similar
|
||||
methods, catch <literal>SecurityException</literal>
|
||||
exceptions and treat the property as unset.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Avoid unnecessary file system or network access.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Avoid explicit class loading. Access to a suitable class
|
||||
loader might not be available when executing as untrusted
|
||||
code.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
If the functionality you are implementing absolutely requires
|
||||
privileged access and this functionality has to be used from
|
||||
untrusted code (hopefully in a restricted and secure manner),
|
||||
see <xref
|
||||
linkend="sect-Defensive_Coding-Java-SecurityManager-Privileged"/>.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Java-SecurityManager-Activate">
|
||||
<title>Activating the Security Manager</title>
|
||||
<para>
|
||||
The usual command to launch a Java application,
|
||||
<command>java</command>, does not activate the security manager.
|
||||
Therefore, the virtual machine does not enforce any sandboxing
|
||||
restrictions, even if explicitly requested by the code (for
|
||||
example, as described in <xref
|
||||
linkend="sect-Defensive_Coding-Java-SecurityManager-Unprivileged"/>).
|
||||
</para>
|
||||
<para>
|
||||
The <option>-Djava.security.manager</option> option activates
|
||||
the security manager, with the fairly restrictive default
|
||||
policy. With a very permissive policy, most Java code will run
|
||||
unchanged. Assuming the policy in <xref
|
||||
linkend="ex-Defensive_Coding-Java-SecurityManager-GrantAll"/>
|
||||
has been saved in a file <filename>grant-all.policy</filename>,
|
||||
this policy can be activated using the option
|
||||
<option>-Djava.security.policy=grant-all.policy</option> (in
|
||||
addition to the <option>-Djava.security.manager</option>
|
||||
option).
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Java-SecurityManager-GrantAll">
|
||||
<title>Most permissve OpenJDK policy file</title>
|
||||
<programlisting>
|
||||
grant {
|
||||
permission java.security.AllPermission;
|
||||
};
|
||||
</programlisting>
|
||||
</example>
|
||||
<para>
|
||||
With this most permissive policy, the security manager is still
|
||||
active, and explicit requests to drop privileges will be
|
||||
honored.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Java-SecurityManager-Unprivileged">
|
||||
<title>Reducing Trust in Code</title>
|
||||
<para>
|
||||
<xref linkend="ex-Defensive_Coding-Java-SecurityManager-Unprivileged"/>
|
||||
shows how to run a piece code of with reduced privileges.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Java-SecurityManager-Unprivileged">
|
||||
<title>Using the security manager to run code with reduced
|
||||
privileges</title>
|
||||
<xi:include href="snippets/Java-SecurityManager-Unprivileged.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
The example above does not add any additional permissions to the
|
||||
<literal>permissions</literal> object. If such permissions are
|
||||
necessary, code like the following (which grants read permission
|
||||
on all files in the current directory) can be used:
|
||||
</para>
|
||||
<informalexample>
|
||||
<xi:include href="snippets/Java-SecurityManager-CurrentDirectory.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</informalexample>
|
||||
<important>
|
||||
<para>
|
||||
Calls to the
|
||||
<function>java.security.AccessController.doPrivileged()</function>
|
||||
methods do not enforce any additional restriction if no
|
||||
security manager has been set. Except for a few special
|
||||
exceptions, the restrictions no longer apply if the
|
||||
<function>doPrivileged()</function> has returned, even to
|
||||
objects created by the code which ran with reduced privileges.
|
||||
(This applies to object finalization in particular.)
|
||||
</para>
|
||||
<para>
|
||||
The example code above does not prevent the called code from
|
||||
calling the
|
||||
<function>java.security.AccessController.doPrivileged()</function>
|
||||
methods. This mechanism should be considered an additional
|
||||
safety net, but it still can be used to prevent unexpected
|
||||
behavior of trusted code. As long as the executed code is not
|
||||
dynamic and came with the original application or library, the
|
||||
sandbox is fairly effective.
|
||||
</para>
|
||||
<para>
|
||||
The <literal>context</literal> argument in <xref
|
||||
linkend="ex-Defensive_Coding-Java-SecurityManager-Unprivileged"/>
|
||||
is extremely important—otherwise, this code would increase
|
||||
privileges instead of reducing them.
|
||||
</para>
|
||||
</important>
|
||||
<para>
|
||||
For activating the security manager, see <xref
|
||||
linkend="sect-Defensive_Coding-Java-SecurityManager-Activate"/>.
|
||||
Unfortunately, this affects the virtual machine as a whole, so
|
||||
it is not possible to do this from a library.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Java-SecurityManager-Privileged">
|
||||
<title>Re-gaining Privileges</title>
|
||||
<para>
|
||||
Ordinarily, when trusted code is called from untrusted code, it
|
||||
loses its privileges (because of the untrusted stack frames
|
||||
visible to stack inspection). The
|
||||
<function>java.security.AccessController.doPrivileged()</function>
|
||||
family of methods provides a controlled backdoor from untrusted
|
||||
to trusted code.
|
||||
</para>
|
||||
<important>
|
||||
<para>
|
||||
By design, this feature can undermine the Java security model
|
||||
and the sandbox. It has to be used very carefully. Most
|
||||
sandbox vulnerabilities can be traced back to its misuse.
|
||||
</para>
|
||||
</important>
|
||||
<para>
|
||||
In essence, the <function>doPrivileged()</function> methods
|
||||
cause the stack inspection to end at their call site. Untrusted
|
||||
code further down the call stack becomes invisible to security
|
||||
checks.
|
||||
</para>
|
||||
<para>
|
||||
The following operations are common and safe to perform with
|
||||
elevated privileges.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
Reading custom system properties with fixed names,
|
||||
especially if the value is not propagated to untrusted code.
|
||||
(File system paths including installation paths, host names
|
||||
and user names are sometimes considered private information
|
||||
and need to be protected.)
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Reading from the file system at fixed paths, either
|
||||
determined at compile time or by a system property. Again,
|
||||
leaking the file contents to the caller can be problematic.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Accessing network resources under a fixed address, name or
|
||||
URL, derived from a system property or configuration file,
|
||||
information leaks not withstanding.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
<xref linkend="ex-Defensive_Coding-Java-SecurityManager-Privileged"/>
|
||||
shows how to request additional privileges.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Java-SecurityManager-Privileged">
|
||||
<title>Using the security manager to run code with increased
|
||||
privileges</title>
|
||||
<xi:include href="snippets/Java-SecurityManager-Privileged.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
Obviously, this only works if the class containing the call to
|
||||
<function>doPrivileged()</function> is marked trusted (usually
|
||||
because it is loaded from a trusted class loader).
|
||||
</para>
|
||||
<para>
|
||||
When writing code that runs with elevated privileges, make sure
|
||||
that you follow the rules below.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
Make the privileged code as small as possible. Perform as
|
||||
many computations as possible before and after the
|
||||
privileged code section, even if it means that you have to
|
||||
define a new class to pass the data around.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Make sure that you either control the inputs to the
|
||||
privileged code, or that the inputs are harmless and cannot
|
||||
affect security properties of the privileged code.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Data that is returned from or written by the privileged code
|
||||
must either be restricted (that is, it cannot be accessed by
|
||||
untrusted code), or must be harmless. Otherwise, privacy
|
||||
leaks or information disclosures which affect security
|
||||
properties can be the result.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
If the code calls back into untrusted code at a later stage (or
|
||||
performs other actions under control from the untrusted caller),
|
||||
you must obtain the original security context and restore it
|
||||
before performing the callback, as in <xref
|
||||
linkend="ex-Defensive_Coding-Java-SecurityManager-Callback"/>.
|
||||
(In this example, it would be much better to move the callback
|
||||
invocation out of the privileged code section, of course.)
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Java-SecurityManager-Callback">
|
||||
<title>Restoring privileges when invoking callbacks</title>
|
||||
<xi:include href="snippets/Java-SecurityManager-Callback.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
</section>
|
||||
|
||||
</section>
|
||||
|
|
@ -1,11 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE chapter PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<chapter id="chap-Defensive_Coding-Java">
|
||||
<title>The Java Programming Language</title>
|
||||
|
||||
<xi:include href="Java-Language.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="Java-LowLevel.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
<xi:include href="Java-SecurityManager.xml" xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</chapter>
|
||||
|
|
@ -1,74 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE section PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<chapter id="chap-Defensive_Coding-Python">
|
||||
<title>The Python Programming Language</title>
|
||||
<para>
|
||||
Python provides memory safety by default, so low-level security
|
||||
vulnerabilities are rare and typically needs fixing the Python
|
||||
interpreter or standard library itself.
|
||||
</para>
|
||||
<para>
|
||||
Other sections with Python-specific advice include:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
<xref linkend="chap-Defensive_Coding-Tasks-Temporary_Files"/>
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<xref linkend="sect-Defensive_Coding-Tasks-Processes-Creation"/>
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<xref linkend="chap-Defensive_Coding-Tasks-Serialization"/>, in
|
||||
particular <xref linkend="sect-Defensive_Coding-Tasks-Serialization-Library"/>
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<xref linkend="sect-Defensive_Coding-Tasks-Cryptography-Randomness"/>
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<section>
|
||||
<title>Dangerous Standard Library Features</title>
|
||||
<para>
|
||||
Some areas of the standard library, notably the
|
||||
<literal>ctypes</literal> module, do not provide memory safety
|
||||
guarantees comparable to the rest of Python. If such
|
||||
functionality is used, the advice in <xref
|
||||
linkend="sect-Defensive_Coding-C-Language"/> should be followed.
|
||||
</para>
|
||||
</section>
|
||||
<section>
|
||||
<title>Run-time Compilation and Code Generation</title>
|
||||
<para>
|
||||
The following Python functions and statements related to code
|
||||
execution should be avoided:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem><para><function>compile</function></para></listitem>
|
||||
<listitem><para><function>eval</function></para></listitem>
|
||||
<listitem><para><literal>exec</literal></para></listitem>
|
||||
<listitem><para><function>execfile</function></para></listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
If you need to parse integers or floating point values, use the
|
||||
<function>int</function> and <function>float</function>
|
||||
functions instead of <function>eval</function>. Sandboxing
|
||||
untrusted Python code does not work reliably.
|
||||
</para>
|
||||
</section>
|
||||
<section>
|
||||
<title>Sandboxing</title>
|
||||
<para>
|
||||
The <literal>rexec</literal> Python module cannot safely sandbox
|
||||
untrusted code and should not be used. The standard CPython
|
||||
implementation is not suitable for sandboxing.
|
||||
</para>
|
||||
</section>
|
||||
</chapter>
|
|
@ -1,96 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE appendix PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
<!ENTITY % BOOK_ENTITIES SYSTEM "Defensive_Coding.ent">
|
||||
%BOOK_ENTITIES;
|
||||
]>
|
||||
<appendix id="appe-Defensive_Coding-Revision_History">
|
||||
<title>Revision History</title>
|
||||
<simpara>
|
||||
<revhistory>
|
||||
<revision>
|
||||
<revnumber>1.3-1</revnumber>
|
||||
<date>Mon Oct 13 2014</date>
|
||||
<author>
|
||||
<firstname>Florian</firstname>
|
||||
<surname>Weimer</surname>
|
||||
<email>fweimer@redhat.com</email>
|
||||
</author>
|
||||
<revdescription>
|
||||
<simplelist>
|
||||
<member>Go: Mention default value handling in deserialization</member>
|
||||
<member>Shell: New chapter</member>
|
||||
</simplelist>
|
||||
</revdescription>
|
||||
</revision>
|
||||
<revision>
|
||||
<revnumber>1.2-1</revnumber>
|
||||
<date>Wed Jul 16 2014</date>
|
||||
<author>
|
||||
<firstname>Florian</firstname>
|
||||
<surname>Weimer</surname>
|
||||
<email>fweimer@redhat.com</email>
|
||||
</author>
|
||||
<revdescription>
|
||||
<simplelist>
|
||||
<member>C: Corrected the <function>strncat</function> example</member>
|
||||
<member>C: Mention mixed signed/unsigned comparisons</member>
|
||||
<member>C: Unsigned overflow checking example</member>
|
||||
<member>C++: <literal>operator new[]</literal> has been fixed in GCC</member>
|
||||
<member>C++: Additional material on <literal>std::string</literal>, iterators</member>
|
||||
<member>OpenSSL: Mention <command>openssl genrsa</command> entropy issue</member>
|
||||
<member>Packaging: X.509 key generation</member>
|
||||
<member>Go, Vala: Add short chapters</member>
|
||||
<member>Serialization: Notes on fragmentation and reassembly</member>
|
||||
</simplelist>
|
||||
</revdescription>
|
||||
</revision>
|
||||
<revision>
|
||||
<revnumber>1.1-1</revnumber>
|
||||
<date>Tue Aug 27 2013</date>
|
||||
<author>
|
||||
<firstname>Eric</firstname>
|
||||
<surname>Christensen</surname>
|
||||
<email>sparks@redhat.com</email>
|
||||
</author>
|
||||
<revdescription>
|
||||
<simplelist>
|
||||
<member>Add a chapter which covers some Java topics.</member>
|
||||
<member>Deserialization: Warn about Java's java.beans.XMLDecoder.</member>
|
||||
<member>C: Correct the advice on array allocation
|
||||
(<ulink url="https://bugzilla.redhat.com/show_bug.cgi?id=995595">bug 995595</ulink>).</member>
|
||||
<member>C: Add material on global variables.</member>
|
||||
</simplelist>
|
||||
</revdescription>
|
||||
</revision>
|
||||
<revision>
|
||||
<revnumber>1.0-1</revnumber>
|
||||
<date>Thu May 09 2013</date>
|
||||
<author>
|
||||
<firstname>Eric</firstname>
|
||||
<surname>Christensen</surname>
|
||||
<email>sparks@redhat.com</email>
|
||||
</author>
|
||||
<revdescription>
|
||||
<simplelist>
|
||||
<member>Added more C and C++ examples.</member>
|
||||
<member>TLS Client NSS: Rely on NSS 3.14 cipher suite defaults.</member>
|
||||
</simplelist>
|
||||
</revdescription>
|
||||
</revision>
|
||||
<revision>
|
||||
<revnumber>0-1</revnumber>
|
||||
<date>Thu Mar 7 2013</date>
|
||||
<author>
|
||||
<firstname>Eric</firstname>
|
||||
<surname>Christensen</surname>
|
||||
<email>sparks@redhat.com</email>
|
||||
</author>
|
||||
<revdescription>
|
||||
<simplelist>
|
||||
<member>Initial publication.</member>
|
||||
</simplelist>
|
||||
</revdescription>
|
||||
</revision>
|
||||
</revhistory>
|
||||
</simpara>
|
||||
</appendix>
|
454
en-US/Shell.xml
454
en-US/Shell.xml
|
@ -1,454 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE chapter PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<chapter id="chap-Defensive_Coding-Shell">
|
||||
<title>Shell Programming and <application>bash</application></title>
|
||||
<para>
|
||||
This chapter contains advice about shell programming, specifically
|
||||
in <application>bash</application>. Most of the advice will apply
|
||||
to scripts written for other shells because extensions such as
|
||||
integer or array variables have been implemented there as well, with
|
||||
comparable syntax.
|
||||
</para>
|
||||
<section id="sect-Defensive_Coding-Shell-Alternatives">
|
||||
<title>Consider Alternatives</title>
|
||||
<para>
|
||||
Once a shell script is so complex that advice in this chapter
|
||||
applies, it is time to step back and consider the question: Is
|
||||
there a more suitable implementation language available?
|
||||
</para>
|
||||
<para>
|
||||
For example, Python with its <literal>subprocess</literal> module
|
||||
can be used to write scripts which are almost as concise as shell
|
||||
scripts when it comes to invoking external programs, and Python
|
||||
offers richer data structures, with less arcane syntax and more
|
||||
consistent behavior.
|
||||
</para>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-Shell-Language">
|
||||
<title>Shell Language Features</title>
|
||||
<para>
|
||||
The following sections cover subtleties concerning the shell
|
||||
programming languages. They have been written with the
|
||||
<application>bash</application> shell in mind, but some of these
|
||||
features apply to other shells as well.
|
||||
</para>
|
||||
<para>
|
||||
Some of the features described may seem like implementation defects,
|
||||
but these features have been replicated across multiple independent
|
||||
implementations, so they now have to be considered part of the shell
|
||||
programming language.
|
||||
</para>
|
||||
<section id="sect-Defensive_Coding-Shell-Parameter_Expansion">
|
||||
<title>Parameter Expansion</title>
|
||||
<para>
|
||||
The mechanism by which named shell variables and parameters are
|
||||
expanded is called <emphasis>parameter expansion</emphasis>. The
|
||||
most basic syntax is
|
||||
“<literal>$</literal><emphasis>variable</emphasis>” or
|
||||
“<literal>${</literal><emphasis>variable</emphasis><literal>}</literal>”.
|
||||
</para>
|
||||
<para>
|
||||
In almost all cases, a parameter expansion should be enclosed in
|
||||
double quotation marks <literal>"</literal>…<literal>"</literal>.
|
||||
</para>
|
||||
<informalexample>
|
||||
<programlisting language="Bash">
|
||||
external-program "$arg1" "$arg2"
|
||||
</programlisting>
|
||||
</informalexample>
|
||||
<para>
|
||||
If the double quotation marks are omitted, the value of the
|
||||
variable will be split according to the current value of the
|
||||
<envar>IFS</envar> variable. This may allow the injection of
|
||||
additional options which are then processed by
|
||||
<literal>external-program</literal>.
|
||||
</para>
|
||||
<para>
|
||||
Parameter expansion can use special syntax for specific features,
|
||||
such as substituting defaults or performing string or array
|
||||
operations. These constructs should not be used because they can
|
||||
trigger arithmetic evaluation, which can result in code execution.
|
||||
See <xref linkend="sect-Defensive_Coding-Shell-Arithmetic"/>.
|
||||
</para>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-Shell-Double_Expansion">
|
||||
<title>Double Expansion</title>
|
||||
<para>
|
||||
<emphasis>Double expansion</emphasis> occurs when, during the
|
||||
expansion of a shell variable, not just the variable is expanded,
|
||||
replacing it by its value, but the <emphasis>value</emphasis> of
|
||||
the variable is itself is expanded as well. This can trigger
|
||||
arbitrary code execution, unless the value of the variable is
|
||||
verified against a restrictive pattern.
|
||||
</para>
|
||||
<para>
|
||||
The evaluation process is in fact recursive, so a self-referential
|
||||
expression can cause an out-of-memory condition and a shell crash.
|
||||
</para>
|
||||
<para>
|
||||
Double expansion may seem like as a defect, but it is implemented
|
||||
by many shells, and has to be considered an integral part of the
|
||||
shell programming language. However, it does make writing robust
|
||||
shell scripts difficult.
|
||||
</para>
|
||||
<para>
|
||||
Double expansion can be requested explicitly with the
|
||||
<literal>eval</literal> built-in command, or by invoking a
|
||||
subshell with “<literal>bash -c</literal>”. These constructs
|
||||
should not be used.
|
||||
</para>
|
||||
<para>
|
||||
The following sections give examples of places where implicit
|
||||
double expansion occurs.
|
||||
</para>
|
||||
<section id="sect-Defensive_Coding-Shell-Arithmetic">
|
||||
<title>Arithmetic Evaluation</title>
|
||||
<para>
|
||||
<emphasis>Arithmetic evaluation</emphasis> is a process by which
|
||||
the shell computes the integer value of an expression specified
|
||||
as a string. It is highly problematic for two reasons: It
|
||||
triggers double expansion (see <xref
|
||||
linkend="sect-Defensive_Coding-Shell-Double_Expansion"/>), and the
|
||||
language of arithmetic expressions is not self-contained. Some
|
||||
constructs in arithmetic expressions (notably array subscripts)
|
||||
provide a trapdoor from the restricted language of arithmetic
|
||||
expressions to the full shell language, thus paving the way
|
||||
towards arbitrary code execution. Due to double expansion,
|
||||
input which is (indirectly) referenced from an arithmetic
|
||||
expression can trigger execution of arbitrary code, which is
|
||||
potentially harmful.
|
||||
</para>
|
||||
<para>
|
||||
Arithmetic evaluation is triggered by the follow constructs:
|
||||
</para>
|
||||
<!-- The list was constructed by looking at the bash sources and
|
||||
search for the string "expand_". -->
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
The <emphasis>expression</emphasis> in
|
||||
“<literal>$((</literal><emphasis>expression</emphasis><literal>))</literal>”
|
||||
is evaluated. This construct is called <emphasis>arithmetic
|
||||
expansion</emphasis>.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
“<literal>$[</literal><emphasis>expression</emphasis><literal>]</literal>”
|
||||
is a deprecated syntax with the same effect.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The arguments to the <literal>let</literal> shell built-in
|
||||
are evaluated.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
“<literal>((</literal><emphasis>expression</emphasis><literal>))</literal>”
|
||||
is an alternative syntax for “<literal>let
|
||||
</literal><emphasis>expression</emphasis>”.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Conditional expressions surrounded by
|
||||
“<literal>[[</literal>…<literal>]]</literal>” can trigger
|
||||
arithmetic evaluation if certain operators such as
|
||||
<literal>-eq</literal> are used. (The
|
||||
<literal>test</literal> built-in does not perform arithmetic
|
||||
evaluation, even with integer operators such as
|
||||
<literal>-eq</literal>.)
|
||||
</para>
|
||||
<para>
|
||||
The conditional expression
|
||||
“<literal>[[ $</literal><emphasis>variable</emphasis><literal> =~ </literal><emphasis>regexp</emphasis><literal> ]]</literal>”
|
||||
can be used for input validation, assuming that
|
||||
<emphasis>regexp</emphasis> is a constant regular
|
||||
expression.
|
||||
See <xref linkend="sect-Defensive_Coding-Shell-Input_Validation"/>.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Certain parameter expansions, for example
|
||||
“<literal>${</literal><emphasis>variable</emphasis><literal>[</literal><emphasis>expression</emphasis><literal>]}</literal>”
|
||||
(array indexing) or
|
||||
“<literal>${</literal><emphasis>variable</emphasis><literal>:</literal><emphasis>expression</emphasis><literal>}</literal>”
|
||||
(string slicing), trigger arithmetic evaluation of
|
||||
<emphasis>expression</emphasis>.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Assignment to array elements using
|
||||
“<emphasis>array_variable</emphasis><literal>[</literal><emphasis>subscript</emphasis><literal>]=</literal><emphasis>expression</emphasis>”
|
||||
triggers evaluation of <emphasis>subscript</emphasis>, but
|
||||
not <emphasis>expression</emphasis>.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The expressions in the arithmetic <literal>for</literal>
|
||||
command,
|
||||
“<literal>for ((</literal><emphasis>expression1</emphasis><literal>; </literal><emphasis>expression2</emphasis><literal>; </literal><emphasis>expression3</emphasis><literal>)); do </literal><emphasis>commands</emphasis><literal>; done</literal>”
|
||||
are evaluated. This does not apply to the regular
|
||||
for command,
|
||||
“<literal>for </literal><emphasis>variable</emphasis><literal> in </literal><emphasis>list</emphasis><literal>; do </literal><emphasis>commands</emphasis><literal>; done</literal>”.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<important>
|
||||
<para>
|
||||
Depending on the <application>bash</application> version, the
|
||||
above list may be incomplete.
|
||||
</para>
|
||||
<para>
|
||||
If faced with a situation where using such shell features
|
||||
appears necessary, see <xref
|
||||
linkend="sect-Defensive_Coding-Shell-Alternatives"/>.
|
||||
</para>
|
||||
</important>
|
||||
<para>
|
||||
If it is impossible to avoid shell arithmetic on untrusted
|
||||
inputs, refer to <xref
|
||||
linkend="sect-Defensive_Coding-Shell-Input_Validation"/>.
|
||||
</para>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-Shell-Types">
|
||||
<title>Type declarations</title>
|
||||
<para>
|
||||
<application>bash</application> supports explicit type
|
||||
declarations for shell variables:
|
||||
</para>
|
||||
<informalexample>
|
||||
<programlisting language="Bash">
|
||||
declare -i integer_variable
|
||||
declare -a array_variable
|
||||
declare -A assoc_array_variable
|
||||
|
||||
typeset -i integer_variable
|
||||
typeset -a array_variable
|
||||
typeset -A assoc_array_variable
|
||||
|
||||
local -i integer_variable
|
||||
local -a array_variable
|
||||
local -A assoc_array_variable
|
||||
|
||||
readonly -i integer_variable
|
||||
readonly -a array_variable
|
||||
readonly -A assoc_array_variable
|
||||
</programlisting>
|
||||
</informalexample>
|
||||
<para>
|
||||
Variables can also be declared as arrays by assigning them an
|
||||
array expression, as in:
|
||||
</para>
|
||||
<informalexample>
|
||||
<programlisting language="Bash">
|
||||
array_variable=(1 2 3 4)
|
||||
</programlisting>
|
||||
</informalexample>
|
||||
<para>
|
||||
Some built-ins (such as <literal>mapfile</literal>) can
|
||||
implicitly create array variables.
|
||||
</para>
|
||||
<para>
|
||||
Such type declarations should not be used because assignment to
|
||||
such variables (independent of the concrete syntax used for the
|
||||
assignment) triggers arithmetic expansion (and thus double
|
||||
expansion) of the right-hand side of the assignment operation.
|
||||
See <xref linkend="sect-Defensive_Coding-Shell-Arithmetic"/>.
|
||||
</para>
|
||||
<para>
|
||||
Shell scripts which use integer or array variables should be
|
||||
rewritten in another, more suitable language. Se <xref
|
||||
linkend="sect-Defensive_Coding-Shell-Alternatives"/>.
|
||||
</para>
|
||||
</section>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-Shell-Obscure">
|
||||
<title>Other Obscurities</title>
|
||||
<para>
|
||||
Obscure shell language features should not be used. Examples are:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
Exported functions (<literal>export -f</literal> or
|
||||
<literal>declare -f</literal>).
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Function names which are not valid variable names, such as
|
||||
“<literal>module::function</literal>”.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The possibility to override built-ins or external commands
|
||||
with shell functions.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Changing the value of the <envar>IFS</envar> variable to
|
||||
tokenize strings.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
</section>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-Shell-Invoke">
|
||||
<title>Invoking External Commands</title>
|
||||
<para>
|
||||
When passing shell variables as single command line arguments,
|
||||
they should always be surrounded by double quotes. See
|
||||
<xref linkend="sect-Defensive_Coding-Shell-Parameter_Expansion"/>.
|
||||
</para>
|
||||
<para>
|
||||
Care is required when passing untrusted values as positional
|
||||
parameters to external commands. If the value starts with a hyphen
|
||||
“<literal>-</literal>”, it may be interpreted by the external
|
||||
command as an option. Depending on the external program, a
|
||||
“<literal>--</literal>” argument stops option processing and treats
|
||||
all following arguments as positional parameters. (Double quotes
|
||||
are completely invisible to the command being invoked, so they do
|
||||
not prevent variable values from being interpreted as options.)
|
||||
</para>
|
||||
<para>
|
||||
Cleaning the environment before invoking child processes is
|
||||
difficult to implement in script. <application>bash</application>
|
||||
keeps a hidden list of environment variables which do not correspond
|
||||
to shell variables, and unsetting them from within a
|
||||
<application>bash</application> script is not possible. To reset
|
||||
the environment, a script can re-run itself under the “<literal>env
|
||||
-i</literal>” command with an additional parameter which indicates
|
||||
the environment has been cleared and suppresses a further
|
||||
self-execution. Alternatively, individual commands can be executed
|
||||
with “<literal>env -i</literal>”.
|
||||
</para>
|
||||
<important>
|
||||
<para>
|
||||
Complete isolation from its original execution environment
|
||||
(which is required when the script is executed after a trust
|
||||
transition, e.g., triggered by the SUID mechanism) is impossible
|
||||
to achieve from within the shell script itself. Instead, the
|
||||
invoking process has to clear the process environment (except for
|
||||
few trusted variables) before running the shell script.
|
||||
</para>
|
||||
</important>
|
||||
<para>
|
||||
Checking for failures in executed external commands is recommended.
|
||||
If no elaborate error recovery is needed, invoking “<literal>set
|
||||
-e</literal>” may be sufficient. This causes the script to stop on
|
||||
the first failed command. However, failures in pipes
|
||||
(“<literal>command1 | command2</literal>”) are only detected for the
|
||||
last command in the pipe, errors in previous commands are ignored.
|
||||
This can be changed by invoking “<literal>set -o pipefail</literal>”.
|
||||
Due to architectural limitations, only the process that spawned
|
||||
the entire pipe can check for failures in individual commands;
|
||||
it is not possible for a process to tell if the process feeding
|
||||
data (or the process consuming data) exited normally or with
|
||||
an error.
|
||||
</para>
|
||||
<para>
|
||||
See <xref linkend="sect-Defensive_Coding-Tasks-Processes-Creation"/>
|
||||
for additional details on creating child processes.
|
||||
</para>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-Shell-Temporary_Files">
|
||||
<title>Temporary Files</title>
|
||||
<para>
|
||||
Temporary files should be created with the
|
||||
<literal>mktemp</literal> command, and temporary directories with
|
||||
“<literal>mktemp -d</literal>”.
|
||||
</para>
|
||||
<para>
|
||||
To clean up temporary files and directories, write a clean-up
|
||||
shell function and register it as a trap handler, as shown in
|
||||
<xref linkend="ex-Defensive_Coding-Tasks-Temporary_Files"/>.
|
||||
Using a separate function avoids issues with proper quoting of
|
||||
variables.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Tasks-Temporary_Files">
|
||||
<title>Creating and Cleaning up Temporary Files</title>
|
||||
<informalexample>
|
||||
<programlisting language="Bash">
|
||||
tmpfile="$(mktemp)"
|
||||
|
||||
cleanup () {
|
||||
rm -f -- "$tmpfile"
|
||||
}
|
||||
|
||||
trap cleanup 0
|
||||
</programlisting>
|
||||
</informalexample>
|
||||
</example>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-Shell-Input_Validation">
|
||||
<title>Performing Input Validation</title>
|
||||
<para>
|
||||
In some cases, input validation cannot be avoided. For example,
|
||||
if arithmetic evaluation is absolutely required, it is imperative
|
||||
to check that input values are, in fact, integers. See <xref
|
||||
linkend="sect-Defensive_Coding-Shell-Arithmetic"/>.
|
||||
</para>
|
||||
<para>
|
||||
<xref linkend="ex-Defensive_Coding-Shell-Input_Validation"/>
|
||||
shows a construct which can be used to check if a string
|
||||
“<literal>$value</literal>” is an integer. This construct is
|
||||
specific to <application>bash</application> and not portable to
|
||||
POSIX shells.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Shell-Input_Validation">
|
||||
<title>Input validation in <application>bash</application></title>
|
||||
<xi:include href="snippets/Shell-Input_Validation.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
Using <literal>case</literal> statements for input validation is
|
||||
also possible and supported by other (POSIX) shells, but the
|
||||
pattern language is more restrictive, and it can be difficult to
|
||||
write suitable patterns.
|
||||
</para>
|
||||
<para>
|
||||
The <literal>expr</literal> external command can give misleading
|
||||
results (e.g., if the value being checked contains operators
|
||||
itself) and should not be used.
|
||||
</para>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-Shell-Edit_Guard">
|
||||
<title>Guarding Shell Scripts Against Changes</title>
|
||||
<para>
|
||||
<application>bash</application> only reads a shell script up to
|
||||
the point it is needed for executed the next command. This means
|
||||
that if script is overwritten while it is running, execution can
|
||||
jump to a random part of the script, depending on what is modified
|
||||
in the script and how the file offsets change as a result. (This
|
||||
behavior is needed to support self-extracting shell archives whose
|
||||
script part is followed by a stream of bytes which does not follow
|
||||
the shell language syntax.)
|
||||
</para>
|
||||
<para>
|
||||
Therefore, long-running scripts should be guarded against
|
||||
concurrent modification by putting as much of the program logic
|
||||
into a <literal>main</literal> function, and invoking the
|
||||
<literal>main</literal> function at the end of the script, using
|
||||
this syntax:
|
||||
</para>
|
||||
<informalexample>
|
||||
<programlisting language="Bash">
|
||||
main "$@" ; exit $?
|
||||
</programlisting>
|
||||
</informalexample>
|
||||
<para>
|
||||
This construct ensures that <application>bash</application> will
|
||||
stop execution after the <literal>main</literal> function, instead
|
||||
of opening the script file and trying to read more commands.
|
||||
</para>
|
||||
</section>
|
||||
</chapter>
|
|
@ -1,143 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE chapter PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<chapter id="chap-Defensive_Coding-Tasks-Cryptography">
|
||||
<title>Cryptography</title>
|
||||
|
||||
<section>
|
||||
<title>Primitives</title>
|
||||
<para>
|
||||
Choosing from the following cryptographic primitives is
|
||||
recommended:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem><para>RSA with 2048 bit keys and OAEP or PSS
|
||||
padding</para></listitem>
|
||||
<listitem><para>AES-128 in CBC mode</para></listitem>
|
||||
<listitem><para>AES-128 in GCM mode</para></listitem>
|
||||
<listitem><para>AES-256 in CBC mode</para></listitem>
|
||||
<listitem><para>AES-256 in GCM mode</para></listitem>
|
||||
<listitem><para>SHA-256</para></listitem>
|
||||
<listitem><para>HMAC-SHA-256</para></listitem>
|
||||
<listitem><para>HMAC-SHA-1</para></listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
Other cryptographic algorithms can be used if they are required
|
||||
for interoperability with existing software:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem><para>RSA with key sizes larger than 1024
|
||||
and legacy padding</para></listitem>
|
||||
<listitem><para>AES-192</para></listitem>
|
||||
<listitem><para>3DES (triple DES, with two or three 56 bit keys),
|
||||
but strongly discouraged</para></listitem>
|
||||
<listitem><para>RC4 (but very, very strongly discouraged)</para></listitem>
|
||||
<listitem><para>SHA-1</para></listitem>
|
||||
<listitem><para>HMAC-MD5</para></listitem>
|
||||
</itemizedlist>
|
||||
<important>
|
||||
<title>Important</title>
|
||||
<para>
|
||||
These primitives are difficult to use in a secure way. Custom
|
||||
implementation of security protocols should be avoided. For
|
||||
protecting confidentiality and integrity of network
|
||||
transmissions, TLS should be used (<xref
|
||||
linkend="chap-Defensive_Coding-TLS"/>).
|
||||
</para>
|
||||
<para>
|
||||
In particular, when using AES in CBC mode, it is necessary to
|
||||
add integrity checking by other means, preferably using
|
||||
HMAC-SHA-256 and <emphasis>after</emphasis> encryption (that
|
||||
is, on the encrypted cipher text). For AES in GCM mode,
|
||||
correct construction of nonces is absolutely essential.
|
||||
</para>
|
||||
</important>
|
||||
<!-- TODO: More algorithms are available in the NIST documents
|
||||
linked from: http://wiki.brq.redhat.com/SecurityTechnologies/FIPS -->
|
||||
</section>
|
||||
|
||||
<section>
|
||||
<title id="sect-Defensive_Coding-Tasks-Cryptography-Randomness">Randomness</title>
|
||||
<para>
|
||||
The following facilities can be used to generate unpredictable
|
||||
and non-repeating values. When these functions are used without
|
||||
special safeguards, each individual random value should be at
|
||||
least 12 bytes long.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para><function>PK11_GenerateRandom</function> in the NSS library
|
||||
(usable for high data rates)</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para><function>RAND_bytes</function> in the OpenSSL library
|
||||
(usable for high data rates)</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para><function>gnutls_rnd</function> in GNUTLS, with
|
||||
<literal>GNUTLS_RND_RANDOM</literal> as the first argument
|
||||
(usable for high data rates)</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para><type>java.security.SecureRandom</type> in Java
|
||||
(usable for high data rates)</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para><function>os.urandom</function> in Python</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>The <function>getrandom</function> system call since glibc 2.25</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>The <function>getentropy</function> call since glibc 2.25</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>Reading from the <filename>/dev/urandom</filename>
|
||||
character device</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
All these functions should be non-blocking, and they should not
|
||||
wait until physical randomness becomes available. (Some
|
||||
cryptography providers for Java can cause
|
||||
<type>java.security.SecureRandom</type> to block, however.)
|
||||
Those functions which do not obtain all bits directly from
|
||||
<filename>/dev/urandom</filename> are suitable for high data
|
||||
rates because they do not deplete the system-wide entropy pool.
|
||||
</para>
|
||||
<important>
|
||||
<title>Difficult to use API</title>
|
||||
<para>
|
||||
Both <function>RAND_bytes</function> and
|
||||
<function>PK11_GenerateRandom</function> have three-state
|
||||
return values (with conflicting meanings). Careful error
|
||||
checking is required. Please review the documentation when
|
||||
using these functions.
|
||||
</para>
|
||||
</important>
|
||||
<important>
|
||||
<title>Difficult to use API</title>
|
||||
<para>
|
||||
The <function>getrandom</function> system call has three-state
|
||||
return values, hence requires careful error checking.
|
||||
</para>
|
||||
<para>
|
||||
It was introduced in Linux kernel 3.17, but before glibc 2.25 no API wrappers were
|
||||
provided. As such one could only use it via the syscall interface
|
||||
as <function>syscall(SYS_getrandom, (void*)dest, (size_t)size, (unsigned int)0)</function>.
|
||||
For portable code targetting multiple kernel versions one has to check
|
||||
for the function being available on run-time, and switch to another
|
||||
facility if the running kernel does not support this call.
|
||||
</para>
|
||||
</important>
|
||||
<para>
|
||||
Other sources of randomness should be considered predictable.
|
||||
</para>
|
||||
<para>
|
||||
Generating randomness for cryptographic keys in long-term use
|
||||
may need different steps and is best left to cryptographic
|
||||
libraries.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
</chapter>
|
|
@ -1,267 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE chapter PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<chapter id="sect-Defensive_Coding-Tasks-Descriptors">
|
||||
<title>File Descriptor Management</title>
|
||||
<para>
|
||||
File descriptors underlie all input/output mechanisms offered by
|
||||
the system. They are used to implementation the <literal>FILE
|
||||
*</literal>-based functions found in
|
||||
<literal><stdio.h></literal>, and all the file and network
|
||||
communication facilities provided by the Python and Java
|
||||
environments are eventually implemented in them.
|
||||
</para>
|
||||
<para>
|
||||
File descriptors are small, non-negative integers in userspace,
|
||||
and are backed on the kernel side with complicated data structures
|
||||
which can sometimes grow very large.
|
||||
</para>
|
||||
<section>
|
||||
<title>Closing Descriptors</title>
|
||||
<para>
|
||||
If a descriptor is no longer used by a program and is not closed
|
||||
explicitly, its number cannot be reused (which is problematic in
|
||||
itself, see <xref
|
||||
linkend="sect-Defensive_Coding-Tasks-Descriptors-Limit"/>), and
|
||||
the kernel resources are not freed. Therefore, it is important
|
||||
to close all descriptors at the earliest point in time
|
||||
possible, but not earlier.
|
||||
</para>
|
||||
<section>
|
||||
<title>Error Handling during Descriptor Close</title>
|
||||
<para>
|
||||
The <function>close</function> system call is always
|
||||
successful in the sense that the passed file descriptor is
|
||||
never valid after the function has been called. However,
|
||||
<function>close</function> still can return an error, for
|
||||
example if there was a file system failure. But this error is
|
||||
not very useful because the absence of an error does not mean
|
||||
that all caches have been emptied and previous writes have
|
||||
been made durable. Programs which need such guarantees must
|
||||
open files with <literal>O_SYNC</literal> or use
|
||||
<literal>fsync</literal> or <literal>fdatasync</literal>, and
|
||||
may also have to <literal>fsync</literal> the directory
|
||||
containing the file.
|
||||
</para>
|
||||
</section>
|
||||
<section>
|
||||
<title>Closing Descriptors and Race Conditions</title>
|
||||
<para>
|
||||
Unlike process IDs, which are recycle only gradually, the
|
||||
kernel always allocates the lowest unused file descriptor when
|
||||
a new descriptor is created. This means that in a
|
||||
multi-threaded program which constantly opens and closes file
|
||||
descriptors, descriptors are reused very quickly. Unless
|
||||
descriptor closing and other operations on the same file
|
||||
descriptor are synchronized (typically, using a mutex), there
|
||||
will be race conditons and I/O operations will be applied to
|
||||
the wrong file descriptor.
|
||||
</para>
|
||||
<para>
|
||||
Sometimes, it is necessary to close a file descriptor
|
||||
concurrently, while another thread might be about to use it in
|
||||
a system call. In order to support this, a program needs to
|
||||
create a single special file descriptor, one on which all I/O
|
||||
operations fail. One way to achieve this is to use
|
||||
<function>socketpair</function>, close one of the descriptors,
|
||||
and call <literal>shutdown(fd, SHUTRDWR)</literal> on the
|
||||
other.
|
||||
</para>
|
||||
<para>
|
||||
When a descriptor is closed concurrently, the program does not
|
||||
call <function>close</function> on the descriptor. Instead it
|
||||
program uses <function>dup2</function> to replace the
|
||||
descriptor to be closed with the dummy descriptor created
|
||||
earlier. This way, the kernel will not reuse the descriptor,
|
||||
but it will carry out all other steps associated with calling
|
||||
a descriptor (for instance, if the descriptor refers to a
|
||||
stream socket, the peer will be notified).
|
||||
</para>
|
||||
<para>
|
||||
This is just a sketch, and many details are missing.
|
||||
Additional data structures are needed to determine when it is
|
||||
safe to really close the descriptor, and proper locking is
|
||||
required for that.
|
||||
</para>
|
||||
</section>
|
||||
<section>
|
||||
<title>Lingering State after Close</title>
|
||||
<para>
|
||||
By default, closing a stream socket returns immediately, and
|
||||
the kernel will try to send the data in the background. This
|
||||
means that it is impossible to implement accurate accounting
|
||||
of network-related resource utilization from userspace.
|
||||
</para>
|
||||
<para>
|
||||
The <literal>SO_LINGER</literal> socket option alters the
|
||||
behavior of <function>close</function>, so that it will return
|
||||
only after the lingering data has been processed, either by
|
||||
sending it to the peer successfully, or by discarding it after
|
||||
the configured timeout. However, there is no interface which
|
||||
could perform this operation in the background, so a separate
|
||||
userspace thread is needed for each <function>close</function>
|
||||
call, causing scalability issues.
|
||||
</para>
|
||||
<para>
|
||||
Currently, there is no application-level countermeasure which
|
||||
applies universally. Mitigation is possible with
|
||||
<application>iptables</application> (the
|
||||
<literal>connlimit</literal> match type in particular) and
|
||||
specialized filtering devices for denial-of-service network
|
||||
traffic.
|
||||
</para>
|
||||
<para>
|
||||
These problems are not related to the
|
||||
<literal>TIME_WAIT</literal> state commonly seen in
|
||||
<application>netstat</application> output. The kernel
|
||||
automatically expires such sockets if necessary.
|
||||
</para>
|
||||
</section>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Tasks-Descriptors-Child_Processes">
|
||||
<title>Preventing File Descriptor Leaks to Child Processes</title>
|
||||
<para>
|
||||
Child processes created with <function>fork</function> share
|
||||
the initial set of file descriptors with their parent
|
||||
process. By default, file descriptors are also preserved if
|
||||
a new process image is created with <function>execve</function>
|
||||
(or any of the other functions such as <function>system</function>
|
||||
or <function>posix_spawn</function>).
|
||||
</para>
|
||||
<para>
|
||||
Usually, this behavior is not desirable. There are two ways to
|
||||
turn it off, that is, to prevent new process images from
|
||||
inheriting the file descriptors in the parent process:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
Set the close-on-exec flag on all newly created file
|
||||
descriptors. Traditionally, this flag is controlled by the
|
||||
<literal>FD_CLOEXEC</literal> flag, using
|
||||
<literal>F_GETFD</literal> and <literal>F_SETFD</literal>
|
||||
operations of the <function>fcntl</function> function.
|
||||
</para>
|
||||
<para>
|
||||
However, in a multi-threaded process, there is a race
|
||||
condition: a subprocess could have been created between the
|
||||
time the descriptor was created and the
|
||||
<literal>FD_CLOEXEC</literal> was set. Therefore, many system
|
||||
calls which create descriptors (such as
|
||||
<function>open</function> and <function>openat</function>)
|
||||
now accept the <function>O_CLOEXEC</function> flag
|
||||
(<function>SOCK_CLOEXEC</function> for
|
||||
<function>socket</function> and
|
||||
<function>socketpair</function>), which cause the
|
||||
<literal>FD_CLOEXEC</literal> flag to be set for the file
|
||||
descriptor in an atomic fashion. In addition, a few new
|
||||
systems calls were introduced, such as
|
||||
<function>pipe2</function> and <function>dup3</function>.
|
||||
</para>
|
||||
<para>
|
||||
The downside of this approach is that every descriptor needs
|
||||
to receive special treatment at the time of creation,
|
||||
otherwise it is not completely effective.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
After calling <function>fork</function>, but before creating
|
||||
a new process image with <function>execve</function>, all
|
||||
file descriptors which the child process will not need are
|
||||
closed.
|
||||
</para>
|
||||
<para>
|
||||
Traditionally, this was implemented as a loop over file
|
||||
descriptors ranging from <literal>3</literal> to
|
||||
<literal>255</literal> and later <literal>1023</literal>.
|
||||
But this is only an approximation because it is possible to
|
||||
create file descriptors outside this range easily (see <xref
|
||||
linkend="sect-Defensive_Coding-Tasks-Descriptors-Limit"/>).
|
||||
Another approach reads <filename>/proc/self/fd</filename>
|
||||
and closes the unexpected descriptors listed there, but this
|
||||
approach is much slower.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
At present, environments which care about file descriptor
|
||||
leakage implement the second approach. OpenJDK 6 and 7
|
||||
are among them.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Tasks-Descriptors-Limit">
|
||||
<title>Dealing with the <function>select</function> Limit</title>
|
||||
<para>
|
||||
By default, a user is allowed to open only 1024 files in a
|
||||
single process, but the system administrator can easily change
|
||||
this limit (which is necessary for busy network servers).
|
||||
However, there is another restriction which is more difficult to
|
||||
overcome.
|
||||
</para>
|
||||
<para>
|
||||
The <function>select</function> function only supports a
|
||||
maximum of <literal>FD_SETSIZE</literal> file descriptors
|
||||
(that is, the maximum permitted value for a file descriptor
|
||||
is <literal>FD_SETSIZE - 1</literal>, usually 1023.) If a
|
||||
process opens many files, descriptors may exceed such
|
||||
limits. It is impossible to query such descriptors using
|
||||
<function>select</function>.
|
||||
</para>
|
||||
<para>
|
||||
If a library which creates many file descriptors is used in
|
||||
the same process as a library which uses
|
||||
<function>select</function>, at least one of them needs to
|
||||
be changed. <!-- ??? refer to event-driven programming -->
|
||||
Calls to <function>select</function> can be replaced with
|
||||
calls to <function>poll</function> or another event handling
|
||||
mechanism. Replacing the <function>select</function> function
|
||||
is the recommended approach.
|
||||
</para>
|
||||
<para>
|
||||
Alternatively, the library with high descriptor usage can
|
||||
relocate descriptors above the <literal>FD_SETSIZE</literal>
|
||||
limit using the following procedure.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
Create the file descriptor <literal>fd</literal> as
|
||||
usual, preferably with the <literal>O_CLOEXEC</literal>
|
||||
flag.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Before doing anything else with the descriptor
|
||||
<literal>fd</literal>, invoke:
|
||||
</para>
|
||||
<programlisting language="C">
|
||||
int newfd = fcntl(fd, F_DUPFD_CLOEXEC, (long)FD_SETSIZE);
|
||||
</programlisting>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Check that <literal>newfd</literal> result is
|
||||
non-negative, otherwise close <literal>fd</literal> and
|
||||
report an error, and return.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Close <literal>fd</literal> and continue to use
|
||||
<literal>newfd</literal>.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
The new descriptor has been allocated above the
|
||||
<literal>FD_SETSIZE</literal>. Even though this algorithm
|
||||
is racy in the sense that the <literal>FD_SETSIZE</literal>
|
||||
first descriptors could fill up, a very high degree of
|
||||
physical parallelism is required before this becomes a problem.
|
||||
</para>
|
||||
</section>
|
||||
</chapter>
|
|
@ -1,339 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE chapter PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<chapter id="chap-Defensive_Coding-Tasks-File_System">
|
||||
<title>File System Manipulation</title>
|
||||
<para>
|
||||
In this chapter, we discuss general file system manipulation, with
|
||||
a focus on access files and directories to which an other,
|
||||
potentially untrusted user has write access.
|
||||
</para>
|
||||
<para>
|
||||
Temporary files are covered in their own chapter, <xref
|
||||
linkend="chap-Defensive_Coding-Tasks-Temporary_Files"/>.
|
||||
</para>
|
||||
<section id="sect-Defensive_Coding-Tasks-File_System-Unowned">
|
||||
<title>Working with Files and Directories Owned by Other Users</title>
|
||||
<para>
|
||||
Sometimes, it is necessary to operate on files and directories
|
||||
owned by other (potentially untrusted) users. For example, a
|
||||
system administrator could remove the home directory of a user,
|
||||
or a package manager could update a file in a directory which is
|
||||
owned by an application-specific user. This differs from
|
||||
accessing the file system as a specific user; see
|
||||
<xref linkend="sect-Defensive_Coding-Tasks-File_System-Foreign"/>.
|
||||
</para>
|
||||
<para>
|
||||
Accessing files across trust boundaries faces several
|
||||
challenges, particularly if an entire directory tree is being
|
||||
traversed:
|
||||
</para>
|
||||
<orderedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
Another user might add file names to a writable directory at
|
||||
any time. This can interfere with file creation and the
|
||||
order of names returned by <function>readdir</function>.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Merely opening and closing a file can have side effects.
|
||||
For instance, an automounter can be triggered, or a tape
|
||||
device rewound. Opening a file on a local file system can
|
||||
block indefinitely, due to mandatory file locking, unless
|
||||
the <literal>O_NONBLOCK</literal> flag is specified.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Hard links and symbolic links can redirect the effect of
|
||||
file system operations in unexpected ways. The
|
||||
<literal>O_NOFOLLOW</literal> and
|
||||
<literal>AT_SYMLINK_NOFOLLOW</literal> variants of system
|
||||
calls only affected final path name component.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The structure of a directory tree can change. For example,
|
||||
the parent directory of what used to be a subdirectory
|
||||
within the directory tree being processed could suddenly
|
||||
point outside that directory tree.
|
||||
</para>
|
||||
</listitem>
|
||||
</orderedlist>
|
||||
<para>
|
||||
Files should always be created with the
|
||||
<literal>O_CREAT</literal> and <literal>O_EXCL</literal> flags,
|
||||
so that creating the file will fail if it already exists. This
|
||||
guards against the unexpected appearance of file names, either
|
||||
due to creation of a new file, or hard-linking of an existing
|
||||
file. In multi-threaded programs, rather than manipulating the
|
||||
umask, create the files with mode <literal>000</literal> if
|
||||
possible, and adjust it afterwards with
|
||||
<function>fchmod</function>.
|
||||
</para>
|
||||
<para>
|
||||
To avoid issues related to symbolic links and directory tree
|
||||
restructuring, the “<literal>at</literal>” variants of system
|
||||
calls have to be used (that is, functions like
|
||||
<function>openat</function>, <function>fchownat</function>,
|
||||
<function>fchmodat</function>, and
|
||||
<function>unlinkat</function>, together with
|
||||
<literal>O_NOFOLLOW</literal> or
|
||||
<literal>AT_SYMLINK_NOFOLLOW</literal>). Path names passed to
|
||||
these functions must have just a single component (that is,
|
||||
without a slash). When descending, the descriptors of parent
|
||||
directories must be kept open. The missing
|
||||
<literal>opendirat</literal> function can be emulated with
|
||||
<literal>openat</literal> (with an
|
||||
<literal>O_DIRECTORY</literal> flag, to avoid opening special
|
||||
files with side effects), followed by
|
||||
<literal>fdopendir</literal>.
|
||||
</para>
|
||||
<para>
|
||||
If the “<literal>at</literal>” functions are not available, it
|
||||
is possible to emulate them by changing the current directory.
|
||||
(Obviously, this only works if the process is not multi-threaded.)
|
||||
<function>fchdir</function> has to be used to change the current
|
||||
directory, and the descriptors of the parent directories have to
|
||||
be kept open, just as with the “<literal>at</literal>”-based
|
||||
approach. <literal>chdir("...")</literal> is unsafe because it
|
||||
might ascend outside the intended directory tree.
|
||||
</para>
|
||||
<para>
|
||||
This “<literal>at</literal>” function emulation is currently
|
||||
required when manipulating extended attributes. In this case,
|
||||
the <function>lsetxattr</function> function can be used, with a
|
||||
relative path name consisting of a single component. This also
|
||||
applies to SELinux contexts and the
|
||||
<function>lsetfilecon</function> function.
|
||||
</para>
|
||||
<para>
|
||||
Currently, it is not possible to avoid opening special files
|
||||
<emphasis>and</emphasis> changes to files with hard links if the
|
||||
directory containing them is owned by an untrusted user.
|
||||
(Device nodes can be hard-linked, just as regular files.)
|
||||
<function>fchmodat</function> and <function>fchownat</function>
|
||||
affect files whose link count is greater than one. But opening
|
||||
the files, checking that the link count is one with
|
||||
<function>fstat</function>, and using
|
||||
<function>fchmod</function> and <function>fchown</function> on
|
||||
the file descriptor may have unwanted side effects, due to item
|
||||
2 above. When creating directories, it is therefore important
|
||||
to change the ownership and permissions only after it has been
|
||||
fully created. Until that point, file names are stable, and no
|
||||
files with unexpected hard links can be introduced.
|
||||
</para>
|
||||
<para>
|
||||
Similarly, when just reading a directory owned by an untrusted
|
||||
user, it is currently impossible to reliably avoid opening
|
||||
special files.
|
||||
</para>
|
||||
<para>
|
||||
There is no workaround against the instability of the file list
|
||||
returned by <function>readdir</function>. Concurrent
|
||||
modification of the directory can result in a list of files
|
||||
being returned which never actually existed on disk.
|
||||
</para>
|
||||
<para>
|
||||
Hard links and symbolic links can be safely deleted using
|
||||
<function>unlinkat</function> without further checks because
|
||||
deletion only affects the name within the directory tree being
|
||||
processed.
|
||||
</para>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-Tasks-File_System-Foreign">
|
||||
<title>Accessing the File System as a Different User</title>
|
||||
<para>
|
||||
This section deals with access to the file system as a specific
|
||||
user. This is different from accessing files and directories owned by a
|
||||
different, potentially untrusted user; see <xref
|
||||
linkend="sect-Defensive_Coding-Tasks-File_System-Foreign"/>.
|
||||
</para>
|
||||
<para>
|
||||
One approach is to spawn a child process which runs under the
|
||||
target user and group IDs (both effective and real IDs). Note
|
||||
that this child process can block indefinitely, even when
|
||||
processing regular files only. For example, a special FUSE file
|
||||
system could cause the process to hang in uninterruptible sleep
|
||||
inside a <function>stat</function> system call.
|
||||
</para>
|
||||
<para>
|
||||
An existing process could change its user and group ID using
|
||||
<function>setfsuid</function> and <function>setfsgid</function>.
|
||||
(These functions are preferred over <function>seteuid</function>
|
||||
and <function>setegid</function> because they do not allow the
|
||||
impersonated user to send signals to the process.) These
|
||||
functions are not thread safe. In multi-threaded processes,
|
||||
these operations need to be performed in a single-threaded child
|
||||
process. Unexpected blocking may occur as well.
|
||||
</para>
|
||||
<para>
|
||||
It is not recommended to try to reimplement the kernel
|
||||
permission checks in user space because the required checks are
|
||||
complex. It is also very difficult to avoid race conditions
|
||||
during path name resolution.
|
||||
</para>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-Tasks-File_System-Limits">
|
||||
<title>File System Limits</title>
|
||||
<para>
|
||||
For historical reasons, there are preprocessor constants such as
|
||||
<literal>PATH_MAX</literal>, <literal>NAME_MAX</literal>.
|
||||
However, on most systems, the length of canonical path names
|
||||
(absolute path names with all symbolic links resolved, as
|
||||
returned by <function>realpath</function> or
|
||||
<function>canonicalize_file_name</function>) can exceed
|
||||
<literal>PATH_MAX</literal> bytes, and individual file name
|
||||
components can be longer than <literal>NAME_MAX</literal>. This
|
||||
is also true of the <literal>_PC_PATH_MAX</literal> and
|
||||
<literal>_PC_NAME_MAX</literal> values returned by
|
||||
<function>pathconf</function>, and the
|
||||
<literal>f_namemax</literal> member of <literal>struct
|
||||
statvfs</literal>. Therefore, these constants should not be
|
||||
used. This is also reason why the
|
||||
<function>readdir_r</function> should never be used (instead,
|
||||
use <function>readdir</function>).
|
||||
</para>
|
||||
<para>
|
||||
You should not write code in a way that assumes that there is an
|
||||
upper limit on the number of subdirectories of a directory, the
|
||||
number of regular files in a directory, or the link count of an
|
||||
inode.
|
||||
</para>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-Tasks-File_System-Features">
|
||||
<title>File system features</title>
|
||||
<para>
|
||||
Not all file systems support all features. This makes it very
|
||||
difficult to write general-purpose tools for copying files. For
|
||||
example, a copy operation intending to preserve file permissions
|
||||
will generally fail when copying to a FAT file system.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
Some file systems are case-insensitive. Most should be
|
||||
case-preserving, though.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Name length limits vary greatly, from eight to thousands of
|
||||
bytes. Path length limits differ as well. Most systems
|
||||
impose an upper bound on path names passed to the kernel,
|
||||
but using relative path names, it is possible to create and
|
||||
access files whose absolute path name is essentially of
|
||||
unbounded length.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Some file systems do not store names as fairly unrestricted
|
||||
byte sequences, as it has been traditionally the case on GNU
|
||||
systems. This means that some byte sequences (outside the
|
||||
POSIX safe character set) are not valid names. Conversely,
|
||||
names of existing files may not be representable as byte
|
||||
sequences, and the files are thus inaccessible on GNU
|
||||
systems. Some file systems perform Unicode canonicalization
|
||||
on file names. These file systems preserve case, but
|
||||
reading the name of a just-created file using
|
||||
<function>readdir</function> might still result in a
|
||||
different byte sequence.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Permissions and owners are not universally supported (and
|
||||
SUID/SGID bits may not be available). For example, FAT file
|
||||
systems assign ownership based on a mount option, and
|
||||
generally mark all files as executable. Any attempt to
|
||||
change permissions would result in an error.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Non-regular files (device nodes, FIFOs) are not generally
|
||||
available.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Only on some file systems, files can have holes, that is,
|
||||
not all of their contents is backed by disk storage.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<function>ioctl</function> support (even fairly generic
|
||||
functionality such as <literal>FIEMAP</literal> for
|
||||
discovering physical file layout and holes) is
|
||||
file-system-specific.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Not all file systems support extended attributes, ACLs and
|
||||
SELinux metadata. Size and naming restriction on extended
|
||||
attributes vary.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Hard links may not be supported at all (FAT) or only within
|
||||
the same directory (AFS). Symbolic links may not be
|
||||
available, either. Reflinks (hard links with copy-on-write
|
||||
semantics) are still very rare. Recent systems restrict
|
||||
creation of hard links to users which own the target file or
|
||||
have read/write access to it, but older systems do not.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Renaming (or moving) files using <function>rename</function>
|
||||
can fail (even when <function>stat</function> indicates that
|
||||
the source and target directories are located on the same
|
||||
file system). This system call should work if the old and
|
||||
new paths are located in the same directory, though.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Locking semantics vary among file systems. This affects
|
||||
advisory and mandatory locks. For example, some network
|
||||
file systems do not allow deleting files which are opened by
|
||||
any process.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Resolution of time stamps varies from two seconds to
|
||||
nanoseconds. Not all time stamps are available on all file
|
||||
systems. File creation time (<emphasis>birth
|
||||
time</emphasis>) is not exposed over the
|
||||
<function>stat</function>/<function>fstat</function>
|
||||
interface, even if stored by the file system.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-Tasks-File_System-Free_Space">
|
||||
<title>Checking Free Space</title>
|
||||
<para>
|
||||
The <function>statvfs</function> and
|
||||
<function>fstatvfs</function> functions allow programs to
|
||||
examine the number of available blocks and inodes, through the
|
||||
members <literal>f_bfree</literal>, <literal>f_bavail</literal>,
|
||||
<literal>f_ffree</literal>, and <literal>f_favail</literal> of
|
||||
<literal>struct statvfs</literal>. Some file systems return
|
||||
fictional values in the <literal>f_ffree</literal> and
|
||||
<literal>f_favail</literal> fields, so the only reliable way to
|
||||
discover if the file system still has space for a file is to try
|
||||
to create it. The <literal>f_bfree</literal> field should be
|
||||
reasonably accurate, though.
|
||||
</para>
|
||||
</section>
|
||||
</chapter>
|
||||
|
|
@ -1,195 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE chapter PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<chapter id="chap-Defensive_Coding-Tasks-Library_Design">
|
||||
<title>Library Design</title>
|
||||
<para>
|
||||
Through this section, the term <emphasis>client code</emphasis>
|
||||
refers to applications and other libraries using the library.
|
||||
</para>
|
||||
|
||||
<section>
|
||||
<title>State Management</title>
|
||||
<para>
|
||||
</para>
|
||||
<section>
|
||||
<title>Global State</title>
|
||||
<para>
|
||||
Global state should be avoided.
|
||||
</para>
|
||||
<para>
|
||||
If this is impossible, the global state must be protected with
|
||||
a lock. For C/C++, you can use the
|
||||
<function>pthread_mutex_lock</function>
|
||||
and <function>pthread_mutex_unlock</function>
|
||||
functions without linking against <literal>-lpthread</literal>
|
||||
because the system provides stubs for non-threaded processes.
|
||||
</para>
|
||||
<para>
|
||||
For compatibility with <function>fork</function>, these locks
|
||||
should be acquired and released in helpers registered with
|
||||
<function>pthread_atfork</function>. This function is not
|
||||
available without <literal>-lpthread</literal>, so you need to
|
||||
use <function>dlsym</function> or a weak symbol to obtain its
|
||||
address.
|
||||
</para>
|
||||
<para>
|
||||
If you need <function>fork</function> protection for other
|
||||
reasons, you should store the process ID and compare it to the
|
||||
value returned by <function>getpid</function> each time you
|
||||
access the global state. (<function>getpid</function> is not
|
||||
implemented as a system call and is fast.) If the value
|
||||
changes, you know that you have to re-create the state object.
|
||||
(This needs to be combined with locking, of course.)
|
||||
</para>
|
||||
</section>
|
||||
<section>
|
||||
<title>Handles</title>
|
||||
<para>
|
||||
Library state should be kept behind a curtain. Client code
|
||||
should receive only a handle. In C, the handle can be a
|
||||
pointer to an incomplete <literal>struct</literal>. In C++,
|
||||
the handle can be a pointer to an abstract base class, or it
|
||||
can be hidden using the pointer-to-implementation idiom.
|
||||
</para>
|
||||
<para>
|
||||
The library should provide functions for creating and
|
||||
destroying handles. (In C++, it is possible to use virtual
|
||||
destructors for the latter.) Consistency between creation and
|
||||
destruction of handles is strongly recommended: If the client
|
||||
code created a handle, it is the responsibility of the client
|
||||
code to destroy it. (This is not always possible or
|
||||
convenient, so sometimes, a transfer of ownership has to
|
||||
happen.)
|
||||
</para>
|
||||
<para>
|
||||
Using handles ensures that it is possible to change the way
|
||||
the library represents state in a way that is transparent to
|
||||
client code. This is important to facilitate security updates
|
||||
and many other code changes.
|
||||
</para>
|
||||
<para>
|
||||
It is not always necessary to protect state behind a handle
|
||||
with a lock. This depends on the level of thread safety
|
||||
the library provides.
|
||||
</para>
|
||||
</section>
|
||||
</section>
|
||||
|
||||
<section>
|
||||
<title>Object Orientation</title>
|
||||
<para>
|
||||
Classes should be either designed as base classes, or it should
|
||||
be impossible to use them as base classes (like
|
||||
<literal>final</literal> classes in Java). Classes which are
|
||||
not designed for inheritance and are used as base classes
|
||||
nevertheless create potential maintenance hazards because it is
|
||||
difficult to predict how client code will react when calls to
|
||||
virtual methods are added, reordered or removed.
|
||||
</para>
|
||||
<para>
|
||||
Virtual member functions can be used as callbacks. See
|
||||
<xref linkend="sect-Defensive_Coding-Tasks-Library_Design-Callbacks"/>
|
||||
for some of the challenges involved.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Tasks-Library_Design-Callbacks">
|
||||
<title>Callbacks</title>
|
||||
<para>
|
||||
Higher-order code is difficult to analyze for humans and
|
||||
computers alike, so it should be avoided. Often, an
|
||||
iterator-based interface (a library function which is called
|
||||
repeatedly by client code and returns a stream of events) leads
|
||||
to a better design which is easier to document and use.
|
||||
</para>
|
||||
<para>
|
||||
If callbacks are unavoidable, some guidelines for them follow.
|
||||
</para>
|
||||
<para>
|
||||
In modern C++ code, <literal>std::function</literal> objects
|
||||
should be used for callbacks.
|
||||
</para>
|
||||
<para>
|
||||
In older C++ code and in C code, all callbacks must have an
|
||||
additional closure parameter of type <literal>void *</literal>,
|
||||
the value of which can be specified by client code. If
|
||||
possible, the value of the closure parameter should be provided
|
||||
by client code at the same time a specific callback is
|
||||
registered (or specified as a function argument). If a single
|
||||
closure parameter is shared by multiple callbacks, flexibility
|
||||
is greatly reduced, and conflicts between different pieces of
|
||||
client code using the same library object could be unresolvable.
|
||||
In some cases, it makes sense to provide a de-registration
|
||||
callback which can be used to destroy the closure parameter when
|
||||
the callback is no longer used.
|
||||
</para>
|
||||
<para>
|
||||
Callbacks can throw exceptions or call
|
||||
<function>longjmp</function>. If possible, all library objects
|
||||
should remain in a valid state. (All further operations on them
|
||||
can fail, but it should be possible to deallocate them without
|
||||
causing resource leaks.)
|
||||
</para>
|
||||
<para>
|
||||
The presence of callbacks raises the question if functions
|
||||
provided by the library are <emphasis>reentrant</emphasis>.
|
||||
Unless a library was designed for such use, bad things will
|
||||
happen if a callback function uses functions in the same library
|
||||
(particularly if they are invoked on the same objects and
|
||||
manipulate the same state). When the callback is invoked, the
|
||||
library can be in an inconsistent state. Reentrant functions
|
||||
are more difficult to write than thread-safe functions (by
|
||||
definition, simple locking would immediately lead to deadlocks).
|
||||
It is also difficult to decide what to do when destruction of an
|
||||
object which is currently processing a callback is requested.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section>
|
||||
<title>Process Attributes</title>
|
||||
<para>
|
||||
Several attributes are global and affect all code in the
|
||||
process, not just the library that manipulates them.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem><para>
|
||||
environment variables
|
||||
(see <xref linkend="sect-Defensive_Coding-Tasks-secure_getenv"/>)
|
||||
</para></listitem>
|
||||
<listitem><para>
|
||||
umask
|
||||
</para></listitem>
|
||||
<listitem><para>
|
||||
user IDs, group IDs and capabilities
|
||||
</para></listitem>
|
||||
<listitem><para>
|
||||
current working directory
|
||||
</para></listitem>
|
||||
<listitem><para>
|
||||
signal handlers, signal masks and signal delivery
|
||||
</para></listitem>
|
||||
<listitem><para>
|
||||
file locks (especially <function>fcntl</function> locks
|
||||
behave in surprising ways, not just in a multi-threaded
|
||||
environment)
|
||||
</para></listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
Library code should avoid manipulating these global process
|
||||
attributes. It should not rely on environment variables, umask,
|
||||
the current working directory and signal masks because these
|
||||
attributes can be inherited from an untrusted source.
|
||||
</para>
|
||||
<para>
|
||||
In addition, there are obvious process-wide aspects such as the
|
||||
virtual memory layout, the set of open files and dynamic shared
|
||||
objects, but with the exception of shared objects, these can be
|
||||
manipulated in a relatively isolated way.
|
||||
</para>
|
||||
|
||||
</section>
|
||||
|
||||
</chapter>
|
||||
|
||||
|
|
@ -1,5 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE chapter PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<chapter id="sect-Defensive_Coding-Tasks-Locking">
|
||||
</chapter>
|
|
@ -1,183 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE chapter PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<chapter id="chap-Defensive_Coding-Tasks-Packaging">
|
||||
<title>RPM Packaging</title>
|
||||
<para>
|
||||
This chapter deals with security-related concerns around RPM
|
||||
packaging. It has to be read in conjunction with
|
||||
distribution-specific packaging guidelines.
|
||||
</para>
|
||||
<section id="sect-Defensive_Coding-Tasks-Packaging-Certificates">
|
||||
<title>Generating X.509 Self-signed Certificates during
|
||||
Installation</title>
|
||||
<para>
|
||||
Some applications need X.509 certificates for authentication
|
||||
purposes. For example, a single private/public key pair could
|
||||
be used to define cluster membership, enabling authentication
|
||||
and encryption of all intra-cluster communication. (Lack of
|
||||
certification from a CA matters less in such a context.) For
|
||||
such use, generating the key pair at package installation time
|
||||
when preparing system images for use in the cluster is
|
||||
reasonable. For other use cases, it is necessary to generate
|
||||
the key pair before the service is started for the first time,
|
||||
see <xref linkend="sect-Defensive_Coding-Tasks-Packaging-Certificates-Service"/>,
|
||||
and <ulink url="https://fedoraproject.org/wiki/Packaging:Initial_Service_Setup#Generating_Self-Signed_Certificates">Packaging:Initial Service Setup</ulink>.
|
||||
</para>
|
||||
<important>
|
||||
<para>
|
||||
The way the key is generated may not be suitable for key
|
||||
material of critical value. (<command>openssl
|
||||
genrsa</command> uses, but does not require, entropy from a
|
||||
physical source of randomness, among other things.) Such keys
|
||||
should be stored in a hardware security module if possible,
|
||||
and generated from random bits reserved for this purpose
|
||||
derived from a non-deterministic physical source.
|
||||
</para>
|
||||
</important>
|
||||
<para>
|
||||
In the spec file, we define two RPM variables which contain the
|
||||
names of the files used to store the private and public key, and
|
||||
the user name for the service:
|
||||
</para>
|
||||
<informalexample>
|
||||
<programlisting language="RPM Spec">
|
||||
# Name of the user owning the file with the private key
|
||||
%define tlsuser %{name}
|
||||
# Name of the directory which contains the key and certificate files
|
||||
%define tlsdir %{_sysconfdir}/%{name}
|
||||
%define tlskey %{tlsdir}/%{name}.key
|
||||
%define tlscert %{tlsdir}/%{name}.crt
|
||||
</programlisting>
|
||||
</informalexample>
|
||||
<para>
|
||||
These variables likely need adjustment based on the needs of the
|
||||
package.
|
||||
</para>
|
||||
<para>
|
||||
Typically, the file with the private key needs to be owned by
|
||||
the system user which needs to read it,
|
||||
<literal>%{tlsuser}</literal> (not <literal>root</literal>). In
|
||||
order to avoid races, if the <emphasis>directory</emphasis>
|
||||
<literal>%{tlsdir}</literal> is <emphasis>owned by the services
|
||||
user</emphasis>, you should use the code in <xref
|
||||
linkend="ex-Defensive_Coding-Packaging-Certificates-Owned"/>.
|
||||
The invocation of <application>su</application> with the
|
||||
<option>-s /bin/bash</option> argument is necessary in case the
|
||||
login shell for the user has been disabled.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Packaging-Certificates-Owned">
|
||||
<title>Creating a key pair in a user-owned directory</title>
|
||||
<programlisting language="Bash">
|
||||
%post
|
||||
if [ $1 -eq 1 ] ; then
|
||||
if ! test -e %{tlskey} ; then
|
||||
su -s /bin/bash \
|
||||
-c "umask 077 && openssl genrsa -out %{tlskey} 2048 2>/dev/null" \
|
||||
%{tlsuser}
|
||||
fi
|
||||
if ! test -e %{tlscert} ; then
|
||||
cn="Automatically generated certificate for the %{tlsuser} service"
|
||||
req_args="-key %{tlskey} -out %{tlscert} -days 7305 -subj \"/CN=$cn/\""
|
||||
su -s /bin/bash \
|
||||
-c "openssl req -new -x509 -extensions usr_cert $req_args" \
|
||||
%{tlsuser}
|
||||
fi
|
||||
fi
|
||||
|
||||
%files
|
||||
%dir %attr(0755,%{tlsuser},%{tlsuser]) %{tlsdir}
|
||||
%ghost %attr(0600,%{tlsuser},%{tlsuser}) %config(noreplace) %{tlskey}
|
||||
%ghost %attr(0644,%{tlsuser},%{tlsuser}) %config(noreplace) %{tlscert}
|
||||
</programlisting>
|
||||
</example>
|
||||
<para>
|
||||
The files containing the key material are marked as ghost
|
||||
configuration files. This ensures that they are tracked in the
|
||||
RPM database as associated with the package, but RPM will not
|
||||
create them when the package is installed and not verify their
|
||||
contents (the <literal>%ghost</literal>), or delete the files
|
||||
when the package is uninstalled (the
|
||||
<literal>%config(noreplace)</literal> part).
|
||||
</para>
|
||||
<para>
|
||||
If the <emphasis>directory</emphasis>
|
||||
<literal>%{tlsdir}</literal> <emphasis>is owned by</emphasis>
|
||||
<literal>root</literal>, use the code in <xref
|
||||
linkend="ex-Defensive_Coding-Packaging-Certificates-Unowned"/>.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Packaging-Certificates-Unowned">
|
||||
<title>Creating a key pair in a <literal>root</literal>-owned directory</title>
|
||||
<programlisting language="Bash">
|
||||
%post
|
||||
if [ $1 -eq 1 ] ; then
|
||||
if ! test -e %{tlskey} ; then
|
||||
(umask 077 && openssl genrsa -out %{tlskey} 2048 2>/dev/null)
|
||||
chown %{tlsuser} %{tlskey}
|
||||
fi
|
||||
if ! test -e %{tlscert} ; then
|
||||
cn="Automatically generated certificate for the %{tlsuser} service"
|
||||
openssl req -new -x509 -extensions usr_cert \
|
||||
-key %{tlskey} -out %{tlscert} -days 7305 -subj "/CN=$cn/"
|
||||
fi
|
||||
fi
|
||||
|
||||
%files
|
||||
%dir %attr(0755,root,root]) %{tlsdir}
|
||||
%ghost %attr(0600,%{tlsuser},%{tlsuser}) %config(noreplace) %{tlskey}
|
||||
%ghost %attr(0644,root,root) %config(noreplace) %{tlscert}
|
||||
</programlisting>
|
||||
</example>
|
||||
<para>
|
||||
In order for this to work, the package which generates the keys
|
||||
must require the <application>openssl</application> package. If
|
||||
the user which owns the key file is generated by a different
|
||||
package, the package generating the certificate must specify a
|
||||
<literal>Requires(pre):</literal> on the package which creates
|
||||
the user. This ensures that the user account will exist when it
|
||||
is needed for the <application>su</application> or
|
||||
<application>chmod</application> invocation.
|
||||
</para>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-Tasks-Packaging-Certificates-Service">
|
||||
<title>Generating X.509 Self-signed Certificates before Service
|
||||
Start</title>
|
||||
<para>
|
||||
An alternative way to automatically provide an X.509 key pair is
|
||||
to create it just before the service is started for the first
|
||||
time. This ensures that installation images which are created
|
||||
from installed RPM packages receive different key material.
|
||||
Creating the key pair at package installation time (see <xref
|
||||
linkend="sect-Defensive_Coding-Tasks-Packaging-Certificates"/>)
|
||||
would put the key into the image, which may or may not make
|
||||
sense. </para>
|
||||
<important>
|
||||
<para>
|
||||
The caveats about the way the key is generated in <xref
|
||||
linkend="sect-Defensive_Coding-Tasks-Packaging-Certificates"/>
|
||||
apply to this procedure as well.
|
||||
</para>
|
||||
</important>
|
||||
<para>
|
||||
Generating key material before service start may happen very
|
||||
early during boot, when the kernel randomness pool has not yet
|
||||
been initialized. Currently, the only way to check for the
|
||||
initialization is to look for the kernel message
|
||||
<literal>random: nonblocking pool is initialized</literal>, or
|
||||
ensure that the application used for generating the keys
|
||||
is utilizing the <filename>getrandom()</filename> system call.
|
||||
</para>
|
||||
<para>
|
||||
In theory, it is also possible to use an application which reads from
|
||||
<filename>/dev/random</filename> while generating the key
|
||||
material (instead of <filename>/dev/urandom</filename>), but
|
||||
this can block not just during the boot process, but also much
|
||||
later at run time, and generally results in a poor user
|
||||
experience.
|
||||
</para>
|
||||
<para>
|
||||
The requirements for generating such keys is documented at
|
||||
<ulink url="https://fedoraproject.org/wiki/Packaging:Initial_Service_Setup#Generating_Self-Signed_Certificates">Packaging:Initial Service Setup</ulink>.
|
||||
</para>
|
||||
</section>
|
||||
</chapter>
|
|
@ -1,483 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE chapter PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<chapter id="sect-Defensive_Coding-Tasks-Processes">
|
||||
<title>Processes</title>
|
||||
|
||||
<section id="sect-Defensive_Coding-Tasks-Processes-Creation">
|
||||
<title>Creating Safe Processes</title>
|
||||
<para>
|
||||
This section describes how to create new child processes in a
|
||||
safe manner. In addition to the concerns addressed below, there
|
||||
is the possibility of file descriptor leaks, see <xref
|
||||
linkend="sect-Defensive_Coding-Tasks-Descriptors-Child_Processes"/>.
|
||||
</para>
|
||||
<section>
|
||||
<title>Obtaining the Program Path and the Command-line
|
||||
Template</title>
|
||||
<para>
|
||||
The name and path to the program being invoked should be
|
||||
hard-coded or controlled by a static configuration file stored
|
||||
at a fixed location (at an file system absolute path). The
|
||||
same applies to the template for generating the command line.
|
||||
</para>
|
||||
<para>
|
||||
The configured program name should be an absolute path. If it
|
||||
is a relative path, the contents of the <envar>PATH</envar>
|
||||
must be obtained in a secure manner (see <xref
|
||||
linkend="sect-Defensive_Coding-Tasks-secure_getenv"/>).
|
||||
If the <envar>PATH</envar> variable is not set or untrusted,
|
||||
the safe default <literal>/bin:/usr/bin</literal> must be
|
||||
used.
|
||||
</para>
|
||||
<para>
|
||||
If too much flexibility is provided here, it may allow
|
||||
invocation of arbitrary programs without proper authorization.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Tasks-Processes-execve">
|
||||
<title>Bypassing the Shell</title>
|
||||
<para>
|
||||
Child processes should be created without involving the system
|
||||
shell.
|
||||
</para>
|
||||
<para>
|
||||
For C/C++, <function>system</function> should not be used.
|
||||
The <function>posix_spawn</function> function can be used
|
||||
instead, or a combination <function>fork</function> and
|
||||
<function>execve</function>. (In some cases, it may be
|
||||
preferable to use <function>vfork</function> or the
|
||||
Linux-specific <function>clone</function> system call instead
|
||||
of <function>fork</function>.)
|
||||
</para>
|
||||
<para>
|
||||
In Python, the <literal>subprocess</literal> module bypasses
|
||||
the shell by default (when the <literal>shell</literal>
|
||||
keyword argument is not set to true).
|
||||
<function>os.system</function> should not be used.
|
||||
</para>
|
||||
<para>
|
||||
The Java class <type>java.lang.ProcessBuilder</type> can be
|
||||
used to create subprocesses without interference from the
|
||||
system shell.
|
||||
</para>
|
||||
<important>
|
||||
<title>Portability notice</title>
|
||||
<para>
|
||||
On Windows, there is no argument vector, only a single
|
||||
argument string. Each application is responsible for parsing
|
||||
this string into an argument vector. There is considerable
|
||||
variance among the quoting style recognized by applications.
|
||||
Some of them expand shell wildcards, others do not. Extensive
|
||||
application-specific testing is required to make this secure.
|
||||
</para>
|
||||
</important>
|
||||
<para>
|
||||
Note that some common applications (notably
|
||||
<application>ssh</application>) unconditionally introduce the
|
||||
use of a shell, even if invoked directly without a shell. It is
|
||||
difficult to use these applications in a secure manner. In this
|
||||
case, untrusted data should be supplied by other means. For
|
||||
example, standard input could be used, instead of the command
|
||||
line.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Tasks-Processes-environ">
|
||||
<title>Specifying the Process Environment</title>
|
||||
<para>
|
||||
Child processes should be created with a minimal set of
|
||||
environment variables. This is absolutely essential if there
|
||||
is a trust transition involved, either when the parent process
|
||||
was created, or during the creation of the child process.
|
||||
</para>
|
||||
<para>
|
||||
In C/C++, the environment should be constructed as an array of
|
||||
strings and passed as the <varname>envp</varname> argument to
|
||||
<function>posix_spawn</function> or <function>execve</function>.
|
||||
The functions <function>setenv</function>,
|
||||
<function>unsetenv</function> and <function>putenv</function>
|
||||
should not be used. They are not thread-safe and suffer from
|
||||
memory leaks.
|
||||
</para>
|
||||
<para>
|
||||
Python programs need to specify a <literal>dict</literal> for
|
||||
the the <varname>env</varname> argument of the
|
||||
<function>subprocess.Popen</function> constructor.
|
||||
The Java class <literal>java.lang.ProcessBuilder</literal>
|
||||
provides a <function>environment()</function> method,
|
||||
which returns a map that can be manipulated.
|
||||
</para>
|
||||
<para>
|
||||
The following list provides guidelines for selecting the set
|
||||
of environment variables passed to the child process.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
<envar>PATH</envar> should be initialized to
|
||||
<literal>/bin:/usr/bin</literal>.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
<envar>USER</envar> and <envar>HOME</envar> can be inhereted
|
||||
from the parent process environment, or they can be
|
||||
initialized from the <literal>pwent</literal> structure
|
||||
for the user. <!-- ??? refer to dropping privileges -->
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>The <envar>DISPLAY</envar> and <envar>XAUTHORITY</envar>
|
||||
variables should be passed to the subprocess if it is an X
|
||||
program. Note that this will typically not work across trust
|
||||
boundaries because <envar>XAUTHORITY</envar> refers to a file
|
||||
with <literal>0600</literal> permissions.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The location-related environment variables
|
||||
<envar>LANG</envar>, <envar>LANGUAGE</envar>,
|
||||
<envar>LC_ADDRESS</envar>, <envar>LC_ALL</envar>,
|
||||
<envar>LC_COLLATE</envar>, <envar>LC_CTYPE</envar>,
|
||||
<envar>LC_IDENTIFICATION</envar>,
|
||||
<envar>LC_MEASUREMENT</envar>, <envar>LC_MESSAGES</envar>,
|
||||
<envar>LC_MONETARY</envar>, <envar>LC_NAME</envar>,
|
||||
<envar>LC_NUMERIC</envar>, <envar>LC_PAPER</envar>,
|
||||
<envar>LC_TELEPHONE</envar> and <envar>LC_TIME</envar>
|
||||
can be passed to the subprocess if present.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The called process may need application-specific
|
||||
environment variables, for example for passing passwords.
|
||||
(See <xref
|
||||
linkend="sect-Defensive_Coding-Tasks-Processes-Command_Line_Visibility"/>.)
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
All other environment variables should be dropped. Names
|
||||
for new environment variables should not be accepted from
|
||||
untrusted sources.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
</section>
|
||||
|
||||
<section>
|
||||
<title>Robust Argument List Processing</title>
|
||||
<para>
|
||||
When invoking a program, it is sometimes necessary to include
|
||||
data from untrusted sources. Such data should be checked
|
||||
against embedded <literal>NUL</literal> characters because the
|
||||
system APIs will silently truncate argument strings at the first
|
||||
<literal>NUL</literal> character.
|
||||
</para>
|
||||
<para>
|
||||
The following recommendations assume that the program being
|
||||
invoked uses GNU-style option processing using
|
||||
<function>getopt_long</function>. This convention is widely
|
||||
used, but it is just that, and individual programs might
|
||||
interpret a command line in a different way.
|
||||
</para>
|
||||
<para>
|
||||
If the untrusted data has to go into an option, use the
|
||||
<literal>--option-name=VALUE</literal> syntax, placing the
|
||||
option and its value into the same command line argument.
|
||||
This avoids any potential confusion if the data starts with
|
||||
<literal>-</literal>.
|
||||
</para>
|
||||
<para>
|
||||
For positional arguments, terminate the option list with a
|
||||
single <option>--</option> marker after the last option, and
|
||||
include the data at the right position. The
|
||||
<option>--</option> marker terminates option processing, and
|
||||
the data will not be treated as an option even if it starts
|
||||
with a dash.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Tasks-Processes-Command_Line_Visibility">
|
||||
<title>Passing Secrets to Subprocesses</title>
|
||||
<para>
|
||||
The command line (the name of the program and its argument) of
|
||||
a running process is traditionally available to all local
|
||||
users. The called program can overwrite this information, but
|
||||
only after it has run for a bit of time, during which the
|
||||
information may have been read by other processes. However,
|
||||
on Linux, the process environment is restricted to the user
|
||||
who runs the process. Therefore, if you need a convenient way
|
||||
to pass a password to a child process, use an environment
|
||||
variable, and not a command line argument. (See <xref
|
||||
linkend="sect-Defensive_Coding-Tasks-Processes-environ"/>.)
|
||||
</para>
|
||||
<important>
|
||||
<title>Portability notice</title>
|
||||
<para>
|
||||
On some UNIX-like systems (notably Solaris), environment
|
||||
variables can be read by any system user, just like command
|
||||
lines.
|
||||
</para>
|
||||
</important>
|
||||
<para>
|
||||
If the environment-based approach cannot be used due to
|
||||
portability concerns, the data can be passed on standard
|
||||
input. Some programs (notably <application>gpg</application>)
|
||||
use special file descriptors whose numbers are specified on
|
||||
the command line. Temporary files are an option as well, but
|
||||
they might give digital forensics access to sensitive data
|
||||
(such as passphrases) because it is difficult to safely delete
|
||||
them in all cases.
|
||||
</para>
|
||||
</section>
|
||||
</section>
|
||||
|
||||
<section>
|
||||
<title>Handling Child Process Termination</title>
|
||||
<para>
|
||||
When child processes terminate, the parent process is signalled.
|
||||
A stub of the terminated processes (a
|
||||
<emphasis>zombie</emphasis>, shown as
|
||||
<literal><defunct></literal> by
|
||||
<application>ps</application>) is kept around until the status
|
||||
information is collected (<emphasis>reaped</emphasis>) by the
|
||||
parent process. Over the years, several interfaces for this
|
||||
have been invented:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
The parent process calls <function>wait</function>,
|
||||
<function>waitpid</function>, <function>waitid</function>,
|
||||
<function>wait3</function> or <function>wait4</function>,
|
||||
without specifying a process ID. This will deliver any
|
||||
matching process ID. This approach is typically used from
|
||||
within event loops.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The parent process calls <function>waitpid</function>,
|
||||
<function>waitid</function>, or <function>wait4</function>,
|
||||
with a specific process ID. Only data for the specific
|
||||
process ID is returned. This is typically used in code
|
||||
which spawns a single subprocess in a synchronous manner.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The parent process installs a handler for the
|
||||
<literal>SIGCHLD</literal> signal, using
|
||||
<function>sigaction</function>, and specifies to the
|
||||
<literal>SA_NOCLDWAIT</literal> flag.
|
||||
This approach could be used by event loops as well.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
None of these approaches can be used to wait for child process
|
||||
terminated in a completely thread-safe manner. The parent
|
||||
process might execute an event loop in another thread, which
|
||||
could pick up the termination signal. This means that libraries
|
||||
typically cannot make free use of child processes (for example,
|
||||
to run problematic code with reduced privileges in a separate
|
||||
address space).
|
||||
</para>
|
||||
<para>
|
||||
At the moment, the parent process should explicitly wait for
|
||||
termination of the child process using
|
||||
<function>waitpid</function> or <function>waitid</function>,
|
||||
and hope that the status is not collected by an event loop
|
||||
first.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section>
|
||||
<title><literal>SUID</literal>/<literal>SGID</literal>
|
||||
processes</title>
|
||||
<!-- ??? need to document real vs effective UID -->
|
||||
<para>
|
||||
Programs can be marked in the file system to indicate to the
|
||||
kernel that a trust transition should happen if the program is
|
||||
run. The <literal>SUID</literal> file permission bit indicates
|
||||
that an executable should run with the effective user ID equal
|
||||
to the owner of the executable file. Similarly, with the
|
||||
<literal>SGID</literal> bit, the effective group ID is set to
|
||||
the group of the executable file.
|
||||
</para>
|
||||
<para>
|
||||
Linux supports <emphasis>fscaps</emphasis>, which can grant
|
||||
additional capabilities to a process in a finer-grained manner.
|
||||
Additional mechanisms can be provided by loadable security
|
||||
modules.
|
||||
</para>
|
||||
<para>
|
||||
When such a trust transition has happened, the process runs in a
|
||||
potentially hostile environment. Additional care is necessary
|
||||
not to rely on any untrusted information. These concerns also
|
||||
apply to libraries which can be linked into such processes.
|
||||
</para>
|
||||
|
||||
<section id="sect-Defensive_Coding-Tasks-secure_getenv">
|
||||
<title>Accessing Environment Variables</title>
|
||||
<para>
|
||||
The following steps are required so that a program does not
|
||||
accidentally pick up untrusted data from environment
|
||||
variables.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem><para>
|
||||
Compile your C/C++ sources with <literal>-D_GNU_SOURCE</literal>.
|
||||
The Autoconf macro <literal>AC_GNU_SOURCE</literal> ensures this.
|
||||
</para></listitem>
|
||||
<listitem><para>
|
||||
Check for the presence of the <function>secure_getenv</function>
|
||||
and <function>__secure_getenv</function> function. The Autoconf
|
||||
directive <literal>AC_CHECK_FUNCS([__secure_getenv secure_getenv])</literal>
|
||||
performs these checks.
|
||||
</para></listitem>
|
||||
<listitem><para>
|
||||
Arrange for a proper definition of the
|
||||
<function>secure_getenv</function> function. See <xref
|
||||
linkend="ex-Defensive_Coding-Tasks-secure_getenv"/>.
|
||||
</para></listitem>
|
||||
<listitem><para>
|
||||
Use <function>secure_getenv</function> instead of
|
||||
<function>getenv</function> to obtain the value of critical
|
||||
environment variables. <function>secure_getenv</function>
|
||||
will pretend the variable has not bee set if the process
|
||||
environment is not trusted.
|
||||
</para></listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
Critical environment variables are debugging flags,
|
||||
configuration file locations, plug-in and log file locations,
|
||||
and anything else that might be used to bypass security
|
||||
restrictions or cause a privileged process to behave in an
|
||||
unexpected way.
|
||||
</para>
|
||||
<para>
|
||||
Either the <function>secure_getenv</function> function or the
|
||||
<function>__secure_getenv</function> is available from GNU libc.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Tasks-secure_getenv">
|
||||
<title>Obtaining a definition for <function>secure_getenv</function></title>
|
||||
<programlisting language="C">
|
||||
<![CDATA[
|
||||
#include <stdlib.h>
|
||||
|
||||
#ifndef HAVE_SECURE_GETENV
|
||||
# ifdef HAVE__SECURE_GETENV
|
||||
# define secure_getenv __secure_getenv
|
||||
# else
|
||||
# error neither secure_getenv nor __secure_getenv are available
|
||||
# endif
|
||||
#endif
|
||||
]]>
|
||||
</programlisting>
|
||||
</example>
|
||||
</section>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Tasks-Processes-Daemons">
|
||||
<title>Daemons</title>
|
||||
<para>
|
||||
Background processes providing system services
|
||||
(<emphasis>daemons</emphasis>) need to decouple themselves from
|
||||
the controlling terminal and the parent process environment:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>Fork.</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
In the child process, call <function>setsid</function>. The
|
||||
parent process can simply exit (using
|
||||
<function>_exit</function>, to avoid running clean-up
|
||||
actions twice).
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
In the child process, fork again. Processing continues in
|
||||
the child process. Again, the parent process should just
|
||||
exit.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Replace the descriptors 0, 1, 2 with a descriptor for
|
||||
<filename>/dev/null</filename>. Logging should be
|
||||
redirected to <application>syslog</application>.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
Older instructions for creating daemon processes recommended a
|
||||
call to <literal>umask(0)</literal>. This is risky because it
|
||||
often leads to world-writable files and directories, resulting
|
||||
in security vulnerabilities such as arbitrary process
|
||||
termination by untrusted local users, or log file truncation.
|
||||
If the <emphasis>umask</emphasis> needs setting, a restrictive
|
||||
value such as <literal>027</literal> or <literal>077</literal>
|
||||
is recommended.
|
||||
</para>
|
||||
<para>
|
||||
Other aspects of the process environment may have to changed as
|
||||
well (environment variables, signal handler disposition).
|
||||
</para>
|
||||
<para>
|
||||
It is increasingly common that server processes do not run as
|
||||
background processes, but as regular foreground process under a
|
||||
supervising master process (such as
|
||||
<application>systemd</application>). Server processes should
|
||||
offer a command line option which disables forking and
|
||||
replacement of the standard output and standard error streams.
|
||||
Such an option is also useful for debugging.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section>
|
||||
<title>Semantics of Command-line Arguments</title>
|
||||
<!-- ??? This applies in two ways, safely calling an other process
|
||||
and support for being called safely. Also need to address
|
||||
untrusted current directory on USB sticks. -->
|
||||
<para>
|
||||
After process creation and option processing, it is up to the
|
||||
child process to interpret the arguments. Arguments can be
|
||||
file names, host names, or URLs, and many other things. URLs
|
||||
can refer to the local network, some server on the Internet,
|
||||
or to the local file system. Some applications even accept
|
||||
arbitrary code in arguments (for example,
|
||||
<application>python</application> with the
|
||||
<option>-c</option> option).
|
||||
</para>
|
||||
<para>
|
||||
Similar concerns apply to environment variables, the contents
|
||||
of the current directory and its subdirectories.
|
||||
<!-- ??? refer to section on temporary directories -->
|
||||
</para>
|
||||
<para>
|
||||
Consequently, careful analysis is required if it is safe to
|
||||
pass untrusted data to another program.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Tasks-Processes-Fork-Parallel">
|
||||
<title><function>fork</function> as a Primitive for Parallelism</title>
|
||||
<para>
|
||||
A call to <function>fork</function> which is not immediately
|
||||
followed by a call to <function>execve</function> (perhaps after
|
||||
rearranging and closing file descriptors) is typically unsafe,
|
||||
especially from a library which does not control the state of
|
||||
the entire process. Such use of <function>fork</function>
|
||||
should be replaced with proper child processes or threads.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
</chapter>
|
|
@ -1,610 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE chapter PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<chapter id="chap-Defensive_Coding-Tasks-Serialization">
|
||||
<title>Serialization and Deserialization</title>
|
||||
<para>
|
||||
Protocol decoders and file format parsers are often the
|
||||
most-exposed part of an application because they are exposed with
|
||||
little or no user interaction and before any authentication and
|
||||
security checks are made. They are also difficult to write
|
||||
robustly in languages which are not memory-safe.
|
||||
</para>
|
||||
|
||||
<section id="sect-Defensive_Coding-Tasks-Serialization-Decoders">
|
||||
<title>Recommendations for Manually-written Decoders</title>
|
||||
<para>
|
||||
For C and C++, the advice in <xref
|
||||
linkend="sect-Defensive_Coding-C-Pointers"/> applies. In
|
||||
addition, avoid non-character pointers directly into input
|
||||
buffers. Pointer misalignment causes crashes on some
|
||||
architectures.
|
||||
</para>
|
||||
<para>
|
||||
When reading variable-sized objects, do not allocate large
|
||||
amounts of data solely based on the value of a size field. If
|
||||
possible, grow the data structure as more data is read from the
|
||||
source, and stop when no data is available. This helps to avoid
|
||||
denial-of-service attacks where little amounts of input data
|
||||
results in enormous memory allocations during decoding.
|
||||
Alternatively, you can impose reasonable bounds on memory
|
||||
allocations, but some protocols do not permit this.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section>
|
||||
<title>Protocol Design</title>
|
||||
<para>
|
||||
Binary formats with explicit length fields are more difficult to
|
||||
parse robustly than those where the length of dynamically-sized
|
||||
elements is derived from sentinel values. A protocol which does
|
||||
not use length fields and can be written in printable ASCII
|
||||
characters simplifies testing and debugging. However, binary
|
||||
protocols with length fields may be more efficient to parse.
|
||||
</para>
|
||||
<para>
|
||||
In new datagram-oriented protocols, unique numbers such as
|
||||
sequence numbers or identifiers for fragment reassembly (see
|
||||
<xref
|
||||
linkend="sect-Defensive_Coding-Tasks-Serialization-Fragmentation"/>)
|
||||
should be at least 64 bits large, and really should not be
|
||||
smaller than 32 bits in size. Protocols should not permit
|
||||
fragments with overlapping contents.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Tasks-Serialization-Fragmentation">
|
||||
<title>Fragmentation</title>
|
||||
<para>
|
||||
Some serialization formats use frames or protocol data units
|
||||
(PDUs) on lower levels which are smaller than the PDUs on higher
|
||||
levels. With such an architecture, higher-level PDUs may have
|
||||
to be <emphasis>fragmented</emphasis> into smaller frames during
|
||||
serialization, and frames may need
|
||||
<emphasis>reassembly</emphasis> into large PDUs during
|
||||
deserialization.
|
||||
</para>
|
||||
<para>
|
||||
Serialization formats may use conceptually similar structures
|
||||
for completely different purposes, for example storing multiple
|
||||
layers and color channels in a single image file.
|
||||
</para>
|
||||
<para>
|
||||
When fragmenting PDUs, establish a reasonable lower bound for
|
||||
the size of individual fragments (as large as possible—limits as
|
||||
low as one or even zero can add substantial overhead). Avoid
|
||||
fragmentation if at all possible, and try to obtain the maximum
|
||||
acceptable fragment length from a trusted data source.
|
||||
</para>
|
||||
<para>
|
||||
When implementing reassembly, consider the following aspects.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
Avoid allocating significant amount of resources without
|
||||
proper authentication. Allocate memory for the unfragmented
|
||||
PDU as more and more and fragments are encountered, and not
|
||||
based on the initially advertised unfragmented PDU size,
|
||||
unless there is a sufficiently low limit on the unfragmented
|
||||
PDU size, so that over-allocation cannot lead to performance
|
||||
problems.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Reassembly queues on top of datagram-oriented transports
|
||||
should be bounded, both in the combined size of the arrived
|
||||
partial PDUs waiting for reassembly, and the total number of
|
||||
partially reassembled fragments. The latter limit helps to
|
||||
reduce the risk of accidental reassembly of unrelated
|
||||
fragments, as it can happen with small fragment IDs (see
|
||||
<xref linkend="sect-Defensive_Coding-Tasks-Serialization-Fragmentation-ID"/>).
|
||||
It also guards to some extent against deliberate injection of fragments,
|
||||
by guessing fragment IDs.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Carefully keep track of which bytes in the unfragmented PDU
|
||||
have been covered by fragments so far. If message
|
||||
reordering is a concern, the most straightforward data
|
||||
structure for this is an array of bits, with one bit for
|
||||
every byte (or other atomic unit) in the unfragmented PDU.
|
||||
Complete reassembly can be determined by increasing a
|
||||
counter of set bits in the bit array as the bit array is
|
||||
updated, taking overlapping fragments into consideration.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Reject overlapping fragments (that is, multiple fragments
|
||||
which provide data at the same offset of the PDU being
|
||||
fragmented), unless the protocol explicitly requires
|
||||
accepting overlapping fragments. The bit array used for
|
||||
tracking already arrived bytes can be used for this purpose.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Check for conflicting values of unfragmented PDU lengths (if
|
||||
this length information is part of every fragment) and
|
||||
reject fragments which are inconsistent.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Validate fragment lengths and offsets of individual
|
||||
fragments against the unfragmented PDU length (if they are
|
||||
present). Check that the last byte in the fragment does not
|
||||
lie after the end of the unfragmented PDU. Avoid integer
|
||||
overflows in these computations (see <xref
|
||||
linkend="sect-Defensive_Coding-C-Arithmetic"/>).
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<section id="sect-Defensive_Coding-Tasks-Serialization-Fragmentation-ID">
|
||||
<title>Fragment IDs</title>
|
||||
<para>
|
||||
If the underlying transport is datagram-oriented (so that PDUs
|
||||
can be reordered, duplicated or be lost, like with UDP),
|
||||
fragment reassembly needs to take into account endpoint
|
||||
addresses of the communication channel, and there has to be
|
||||
some sort of fragment ID which identifies the individual
|
||||
fragments as part of a larger PDU. In addition, the
|
||||
fragmentation protocol will typically involve fragment offsets
|
||||
and fragment lengths, as mentioned above.
|
||||
</para>
|
||||
<para>
|
||||
If the transport may be subject to blind PDU injection (again,
|
||||
like UDP), the fragment ID must be generated randomly. If the
|
||||
fragment ID is 64 bit or larger (strongly recommended), it can
|
||||
be generated in a completely random fashion for most traffic
|
||||
volumes. If it is less than 64 bits large (so that accidental
|
||||
collisions can happen if a lot of PDUs are transmitted), the
|
||||
fragment ID should be incremented sequentially from a starting
|
||||
value. The starting value should be derived using a HMAC-like
|
||||
construction from the endpoint addresses, using a long-lived
|
||||
random key. This construction ensures that despite the
|
||||
limited range of the ID, accidental collisions are as unlikely
|
||||
as possible. (This will not work reliable with really short
|
||||
fragment IDs, such as the 16 bit IDs used by the Internet
|
||||
Protocol.)
|
||||
</para>
|
||||
</section>
|
||||
</section>
|
||||
|
||||
<section>
|
||||
<title id="sect-Defensive_Coding-Tasks-Serialization-Library">Library
|
||||
Support for Deserialization</title>
|
||||
<para>
|
||||
For some languages, generic libraries are available which allow
|
||||
to serialize and deserialize user-defined objects. The
|
||||
deserialization part comes in one of two flavors, depending on
|
||||
the library. The first kind uses type information in the data
|
||||
stream to control which objects are instantiated. The second
|
||||
kind uses type definitions supplied by the programmer. The
|
||||
first one allows arbitrary object instantiation, the second one
|
||||
generally does not.
|
||||
</para>
|
||||
<para>
|
||||
The following serialization frameworks are in the first category,
|
||||
are known to be unsafe, and must not be used for untrusted data:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem><para>
|
||||
Python's <package>pickle</package> and <package>cPickle</package>
|
||||
modules, and wrappers such as <package>shelve</package>
|
||||
</para></listitem>
|
||||
<listitem><para>
|
||||
Perl's <package>Storable</package> package
|
||||
</para></listitem>
|
||||
<listitem><para>
|
||||
Java serialization (<type>java.io.ObjectInputStream</type>),
|
||||
even if encoded in other formats (as with
|
||||
<type>java.beans.XMLDecoder</type>)
|
||||
</para></listitem>
|
||||
<listitem><para>
|
||||
PHP serialization (<function>unserialize</function>)
|
||||
</para></listitem>
|
||||
<listitem><para>
|
||||
Most implementations of YAML
|
||||
</para></listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
When using a type-directed deserialization format where the
|
||||
types of the deserialized objects are specified by the
|
||||
programmer, make sure that the objects which can be instantiated
|
||||
cannot perform any destructive actions in their destructors,
|
||||
even when the data members have been manipulated.
|
||||
</para>
|
||||
<para>
|
||||
In general, JSON decoders do not suffer from this problem. But
|
||||
you must not use the <function>eval</function> function to parse
|
||||
JSON objects in Javascript; even with the regular expression
|
||||
filter from RFC 4627, there are still information leaks
|
||||
remaining. JSON-based formats can still turn out risky if they
|
||||
serve as an encoding form for any if the serialization
|
||||
frameworks listed above.
|
||||
</para>
|
||||
<para>
|
||||
For serialization in C and C++ projects, the Protocol Buffers serialization
|
||||
(<package>protobuf</package>) provides type safe automated serialization
|
||||
by relying on code generation. It is positioned as similar, but simpler and
|
||||
more efficient to XML serialization.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Tasks-Serialization-XML">
|
||||
<title>XML Serialization</title>
|
||||
<para>
|
||||
</para>
|
||||
<section id="sect-Defensive_Coding-Tasks-Serialization-XML-External">
|
||||
<title>External References</title>
|
||||
<para>
|
||||
XML documents can contain external references. They can occur
|
||||
in various places.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
In the DTD declaration in the header of an XML document:
|
||||
</para>
|
||||
<informalexample>
|
||||
<programlisting language="XML">
|
||||
<![CDATA[<!DOCTYPE html PUBLIC
|
||||
"-//W3C//DTD XHTML 1.0 Transitional//EN"
|
||||
"http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">]]>
|
||||
</programlisting>
|
||||
</informalexample>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
In a namespace declaration:
|
||||
</para>
|
||||
<informalexample>
|
||||
<programlisting language="XML">
|
||||
<![CDATA[<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema">]]>
|
||||
</programlisting>
|
||||
</informalexample>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
In an entity defintion:
|
||||
</para>
|
||||
<informalexample>
|
||||
<programlisting language="XML">
|
||||
<![CDATA[<!ENTITY sys SYSTEM "http://www.example.com/ent.xml">
|
||||
<!ENTITY pub PUBLIC "-//Example//Public Entity//EN"
|
||||
"http://www.example.com/pub-ent.xml">]]>
|
||||
</programlisting>
|
||||
</informalexample>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
In a notation:
|
||||
</para>
|
||||
<informalexample>
|
||||
<programlisting language="XML">
|
||||
<![CDATA[<!NOTATION not SYSTEM "../not.xml">]]>
|
||||
</programlisting>
|
||||
</informalexample>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
Originally, these external references were intended as unique
|
||||
identifiers, but by many XML implementations, they are used
|
||||
for locating the data for the referenced element. This causes
|
||||
unwanted network traffic, and may disclose file system
|
||||
contents or otherwise unreachable network resources, so this
|
||||
functionality should be disabled.
|
||||
</para>
|
||||
<para>
|
||||
Depending on the XML library, external referenced might be
|
||||
processed not just when parsing XML, but also when generating
|
||||
it.
|
||||
</para>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-Tasks-Serialization-XML-Entities">
|
||||
<title>Entity Expansion</title>
|
||||
<para>
|
||||
When external DTD processing is disabled, an internal DTD
|
||||
subset can still contain entity definitions. Entity
|
||||
declarations can reference other entities. Some XML libraries
|
||||
expand entities automatically, and this processing cannot be
|
||||
switched off in some places (such as attribute values or
|
||||
content models). Without limits on the entity nesting level,
|
||||
this expansion results in data which can grow exponentially in
|
||||
length with size of the input. (If there is a limit on the
|
||||
nesting level, the growth is still polynomial, unless further
|
||||
limits are imposed.)
|
||||
</para>
|
||||
<para>
|
||||
Consequently, the processing internal DTD subsets should be
|
||||
disabled if possible, and only trusted DTDs should be
|
||||
processed. If a particular XML application does not permit
|
||||
such restrictions, then application-specific limits are called
|
||||
for.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Tasks-Serialization-XML-XInclude">
|
||||
<title>XInclude Processing</title>
|
||||
<para>
|
||||
XInclude processing can reference file and network resources
|
||||
and include them into the document, much like external entity
|
||||
references. When parsing untrusted XML documents, XInclude
|
||||
processing should be turned off.
|
||||
</para>
|
||||
<para>
|
||||
XInclude processing is also fairly complex and may pull in
|
||||
support for the XPointer and XPath specifications,
|
||||
considerably increasing the amount of code required for XML
|
||||
processing.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Tasks-Serialization-XML-Validation">
|
||||
<title>Algorithmic Complexity of XML Validation</title>
|
||||
<para>
|
||||
DTD-based XML validation uses regular expressions for content
|
||||
models. The XML specification requires that content models
|
||||
are deterministic, which means that efficient validation is
|
||||
possible. However, some implementations do not enforce
|
||||
determinism, and require exponential (or just polynomial)
|
||||
amount of space or time for validating some DTD/document
|
||||
combinations.
|
||||
</para>
|
||||
<para>
|
||||
XML schemas and RELAX NG (via the <literal>xsd:</literal>
|
||||
prefix) directly support textual regular expressions which are
|
||||
not required to be deterministic.
|
||||
</para>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-Tasks-Serialization-XML-Expat">
|
||||
<title>Using Expat for XML parsing</title>
|
||||
<para>
|
||||
By default, Expat does not try to resolve external IDs, so no
|
||||
steps are required to block them. However, internal entity
|
||||
declarations are processed. Installing a callback which stops
|
||||
parsing as soon as such entities are encountered disables
|
||||
them, see <xref
|
||||
linkend="ex-Defensive_Coding-Tasks-Serialization-XML-Expat-EntityDeclHandler"/>.
|
||||
Expat does not perform any validation, so there are no
|
||||
problems related to that.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Tasks-Serialization-XML-Expat-EntityDeclHandler">
|
||||
<title>Disabling XML entity processing with Expat</title>
|
||||
<xi:include href="snippets/Tasks-Serialization-XML-Expat-EntityDeclHandler.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
This handler must be installed when the
|
||||
<literal>XML_Parser</literal> object is created (<xref
|
||||
linkend="ex-Defensive_Coding-Tasks-Serialization-XML-Expat-Create"/>).
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Tasks-Serialization-XML-Expat-Create">
|
||||
<title>Creating an Expat XML parser</title>
|
||||
<xi:include href="snippets/Tasks-Serialization-XML-Expat-Create.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
It is also possible to reject internal DTD subsets altogether,
|
||||
using a suitable
|
||||
<literal>XML_StartDoctypeDeclHandler</literal> handler
|
||||
installed with <function>XML_SetDoctypeDeclHandler</function>.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Tasks-Serialization-Qt">
|
||||
<title>Using Qt for XML Parsing</title>
|
||||
<para>
|
||||
The XML component of Qt, QtXml, does not resolve external IDs
|
||||
by default, so it is not required to prevent such resolution.
|
||||
Internal entities are processed, though. To change that, a
|
||||
custom <literal>QXmlDeclHandler</literal> and
|
||||
<literal>QXmlSimpleReader</literal> subclasses are needed. It
|
||||
is not possible to use the
|
||||
<function>QDomDocument::setContent(const QByteArray
|
||||
&)</function> convenience methods.
|
||||
</para>
|
||||
<para>
|
||||
<xref linkend="ex-Defensive_Coding-Tasks-Serialization-XML-Qt-NoEntityHandler"/>
|
||||
shows an entity handler which always returns errors, causing
|
||||
parsing to stop when encountering entity declarations.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Tasks-Serialization-XML-Qt-NoEntityHandler">
|
||||
<title>A QtXml entity handler which blocks entity processing</title>
|
||||
<xi:include href="snippets/Tasks-Serialization-XML-Qt-NoEntityHandler.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
This handler is used in the custom
|
||||
<literal>QXmlReader</literal> subclass in <xref
|
||||
linkend="ex-Defensive_Coding-Tasks-Serialization-XML-Qt-NoEntityReader"/>.
|
||||
Some parts of QtXml will call the
|
||||
<function>setDeclHandler(QXmlDeclHandler *)</function> method.
|
||||
Consequently, we prevent overriding our custom handler by
|
||||
providing a definition of this method which does nothing. In
|
||||
the constructor, we activate namespace processing; this part
|
||||
may need adjusting.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Tasks-Serialization-XML-Qt-NoEntityReader">
|
||||
<title>A QtXml XML reader which blocks entity processing</title>
|
||||
<xi:include href="snippets/Tasks-Serialization-XML-Qt-NoEntityReader.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
Our <literal>NoEntityReader</literal> class can be used with
|
||||
one of the overloaded
|
||||
<function>QDomDocument::setContent</function> methods.
|
||||
<xref linkend="ex-Defensive_Coding-Tasks-Serialization-XML-Qt-QDomDocument"/>
|
||||
shows how the <literal>buffer</literal> object (of type
|
||||
<literal>QByteArray</literal>) is wrapped as a
|
||||
<literal>QXmlInputSource</literal>. After calling the
|
||||
<function>setContent</function> method, you should check the
|
||||
return value and report any error.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Tasks-Serialization-XML-Qt-QDomDocument">
|
||||
<title>Parsing an XML document with QDomDocument, without entity expansion</title>
|
||||
<xi:include href="snippets/Tasks-Serialization-XML-Qt-QDomDocument.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Tasks-Serialization-XML-OpenJDK_Parse">
|
||||
<title>Using OpenJDK for XML Parsing and Validation</title>
|
||||
<para>
|
||||
OpenJDK contains facilities for DOM-based, SAX-based, and
|
||||
StAX-based document parsing. Documents can be validated
|
||||
against DTDs or XML schemas.
|
||||
</para>
|
||||
<para>
|
||||
The approach taken to deal with entity expansion differs from
|
||||
the general recommendation in <xref
|
||||
linkend="sect-Defensive_Coding-Tasks-Serialization-XML-Entities"/>.
|
||||
We enable the the feature flag
|
||||
<literal>javax.xml.XMLConstants.FEATURE_SECURE_PROCESSING</literal>,
|
||||
which enforces heuristic restrictions on the number of entity
|
||||
expansions. Note that this flag alone does not prevent
|
||||
resolution of external references (system IDs or public IDs),
|
||||
so it is slightly misnamed.
|
||||
</para>
|
||||
<para>
|
||||
In the following sections, we use helper classes to prevent
|
||||
external ID resolution.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Tasks-Serialization-XML-OpenJDK-NoEntityResolver">
|
||||
<title>Helper class to prevent DTD external entity resolution in OpenJDK</title>
|
||||
<xi:include href="snippets/Tasks-Serialization-XML-OpenJDK-NoEntityResolver.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<example id="ex-Defensive_Coding-Tasks-Serialization-XML-OpenJDK-NoResourceResolver">
|
||||
<title>Helper class to prevent schema resolution in
|
||||
OpenJDK</title>
|
||||
<xi:include href="snippets/Tasks-Serialization-XML-OpenJDK-NoResourceResolver.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
<xref linkend="ex-Defensive_Coding-Tasks-Serialization-XML-OpenJDK-Imports"/>
|
||||
shows the imports used by the examples.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Tasks-Serialization-XML-OpenJDK-Imports">
|
||||
<title>Java imports for OpenJDK XML parsing</title>
|
||||
<xi:include href="snippets/Tasks-Serialization-XML-OpenJDK-Imports.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<section id="sect-Defensive_Coding-Tasks-Serialization-XML-OpenJDK_Parse-DOM">
|
||||
<title>DOM-based XML parsing and DTD validation in OpenJDK</title>
|
||||
<para>
|
||||
This approach produces a
|
||||
<literal>org.w3c.dom.Document</literal> object from an input
|
||||
stream. <xref linkend="ex-Defensive_Coding-Tasks-Serialization-XML-OpenJDK_Parse-DOM"/>
|
||||
use the data from the <literal>java.io.InputStream</literal>
|
||||
instance in the <literal>inputStream</literal> variable.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Tasks-Serialization-XML-OpenJDK_Parse-DOM">
|
||||
<title>DOM-based XML parsing in OpenJDK</title>
|
||||
<xi:include href="snippets/Tasks-Serialization-XML-OpenJDK_Parse-DOM.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
External entity references are prohibited using the
|
||||
<literal>NoEntityResolver</literal> class in
|
||||
<xref linkend="ex-Defensive_Coding-Tasks-Serialization-XML-OpenJDK-NoEntityResolver"/>.
|
||||
Because external DTD references are prohibited, DTD validation
|
||||
(if enabled) will only happen against the internal DTD subset
|
||||
embedded in the XML document.
|
||||
</para>
|
||||
<para>
|
||||
To validate the document against an external DTD, use a
|
||||
<literal>javax.xml.transform.Transformer</literal> class to
|
||||
add the DTD reference to the document, and an entity
|
||||
resolver which whitelists this external reference.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="sect-Defensive_Coding-Tasks-Serialization-XML-OpenJDK_Parse-SAX">
|
||||
<title>XML Schema Validation in OpenJDK</title>
|
||||
<para>
|
||||
<xref linkend="ex-Defensive_Coding-Tasks-Serialization-XML-OpenJDK_Parse-XMLSchema_SAX"/>
|
||||
shows how to validate a document against an XML Schema,
|
||||
using a SAX-based approach. The XML data is read from an
|
||||
<literal>java.io.InputStream</literal> in the
|
||||
<literal>inputStream</literal> variable.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Tasks-Serialization-XML-OpenJDK_Parse-XMLSchema_SAX">
|
||||
<title>SAX-based validation against an XML schema in
|
||||
OpenJDK</title>
|
||||
<xi:include href="snippets/Tasks-Serialization-XML-OpenJDK_Parse-XMLSchema_SAX.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
<para>
|
||||
The <literal>NoResourceResolver</literal> class is defined
|
||||
in <xref linkend="ex-Defensive_Coding-Tasks-Serialization-XML-OpenJDK-NoResourceResolver"/>.
|
||||
</para>
|
||||
<para>
|
||||
If you need to validate a document against an XML schema,
|
||||
use the code in <xref
|
||||
linkend="ex-Defensive_Coding-Tasks-Serialization-XML-OpenJDK_Parse-DOM"/>
|
||||
to create the document, but do not enable validation at this
|
||||
point. Then use
|
||||
<xref linkend="ex-Defensive_Coding-Tasks-Serialization-XML-OpenJDK_Parse-XMLSchema_DOM"/>
|
||||
to perform the schema-based validation on the
|
||||
<literal>org.w3c.dom.Document</literal> instance
|
||||
<literal>document</literal>.
|
||||
</para>
|
||||
<example id="ex-Defensive_Coding-Tasks-Serialization-XML-OpenJDK_Parse-XMLSchema_DOM">
|
||||
<title>Validation of a DOM document against an XML schema in
|
||||
OpenJDK</title>
|
||||
<xi:include href="snippets/Tasks-Serialization-XML-OpenJDK_Parse-XMLSchema_DOM.xml"
|
||||
xmlns:xi="http://www.w3.org/2001/XInclude" />
|
||||
</example>
|
||||
</section>
|
||||
<section id="sect-Defensive_Coding-Tasks-Serialization-XML-OpenJDK_Parse-Other">
|
||||
<title>Other XML Parsers in OpenJDK</title>
|
||||
<para>
|
||||
OpenJDK contains additional XML parsing and processing
|
||||
facilities. Some of them are insecure.
|
||||
</para>
|
||||
<para>
|
||||
The class <type>java.beans.XMLDecoder</type> acts as a
|
||||
bridge between the Java object serialization format and XML.
|
||||
It is close to impossible to securely deserialize Java
|
||||
objects in this format from untrusted inputs, so its use is
|
||||
not recommended, as with the Java object serialization
|
||||
format itself. See <xref
|
||||
linkend="sect-Defensive_Coding-Tasks-Serialization-Library"/>.
|
||||
</para>
|
||||
</section>
|
||||
</section>
|
||||
</section>
|
||||
|
||||
<section>
|
||||
<title>Protocol Encoders</title>
|
||||
<para>
|
||||
For protocol encoders, you should write bytes to a buffer which
|
||||
grows as needed, using an exponential sizing policy. Explicit
|
||||
lengths can be patched in later, once they are known.
|
||||
Allocating the required number of bytes upfront typically
|
||||
requires separate code to compute the final size, which must be
|
||||
kept in sync with the actual encoding step, or vulnerabilities
|
||||
may result. In multi-threaded code, parts of the object being
|
||||
deserialized might change, so that the computed size is out of
|
||||
date.
|
||||
</para>
|
||||
<para>
|
||||
You should avoid copying data directly from a received packet
|
||||
during encoding, disregarding the format. Propagating malformed
|
||||
data could enable attacks on other recipients of that data.
|
||||
</para>
|
||||
<para>
|
||||
When using C or C++ and copying whole data structures directly
|
||||
into the output, make sure that you do not leak information in
|
||||
padding bytes between fields or at the end of the
|
||||
<literal>struct</literal>.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
</chapter>
|
||||
|
|
@ -1,257 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE chapter PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<chapter id="chap-Defensive_Coding-Tasks-Temporary_Files">
|
||||
<title>Temporary Files</title>
|
||||
<para>
|
||||
In this chapter, we describe how to create temporary files and
|
||||
directories, how to remove them, and how to work with programs
|
||||
which do not create files in ways that are safe with a shared
|
||||
directory for temporary files. General file system manipulation
|
||||
is treated in a separate chapter, <xref
|
||||
linkend="chap-Defensive_Coding-Tasks-File_System"/>.
|
||||
</para>
|
||||
<para>
|
||||
Secure creation of temporary files has four different aspects.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
The location of the directory for temporary files must be
|
||||
obtained in a secure manner (that is, untrusted environment
|
||||
variables must be ignored, see <xref
|
||||
linkend="sect-Defensive_Coding-Tasks-secure_getenv"/>).
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
A new file must be created. Reusing an existing file must be
|
||||
avoided (the <filename class="directory">/tmp</filename> race
|
||||
condition). This is tricky because traditionally, system-wide
|
||||
temporary directories shared by all users are used.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The file must be created in a way that makes it impossible for
|
||||
other users to open it.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The descriptor for the temporary file should not leak to
|
||||
subprocesses.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
All functions mentioned below will take care of these aspects.
|
||||
</para>
|
||||
<para>
|
||||
Traditionally, temporary files are often used to reduce memory
|
||||
usage of programs. More and more systems use RAM-based file
|
||||
systems such as <literal>tmpfs</literal> for storing temporary
|
||||
files, to increase performance and decrease wear on Flash storage.
|
||||
As a result, spooling data to temporary files does not result in
|
||||
any memory savings, and the related complexity can be avoided if
|
||||
the data is kept in process memory.
|
||||
</para>
|
||||
|
||||
<section id="chap-Defensive_Coding-Tasks-Temporary_Files-Location">
|
||||
<title>Obtaining the Location of Temporary Directory</title>
|
||||
<para>
|
||||
Some functions below need the location of a directory which
|
||||
stores temporary files. For C/C++ programs, use the following
|
||||
steps to obtain that directory:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
Use <function>secure_getenv</function> to obtain the value
|
||||
of the <literal>TMPDIR</literal> environment variable. If
|
||||
it is set, convert the path to a fully-resolved absolute
|
||||
path, using <literal>realpath(path, NULL)</literal>. Check
|
||||
if the new path refers to a directory and is writeable. In
|
||||
this case, use it as the temporary directory.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Fall back to <filename class="directory">/tmp</filename>.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
In Python, you can use the <varname>tempfile.tempdir</varname>
|
||||
variable.
|
||||
</para>
|
||||
<para>
|
||||
Java does not support SUID/SGID programs, so you can use the
|
||||
<function>java.lang.System.getenv(String)</function> method to
|
||||
obtain the value of the <literal>TMPDIR</literal> environment
|
||||
variable, and follow the two steps described above. (Java's
|
||||
default directory selection does not honor
|
||||
<literal>TMPDIR</literal>.)
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section>
|
||||
<title>Named Temporary Files</title>
|
||||
<para>
|
||||
The <function>mkostemp</function> function creates a named
|
||||
temporary file. You should specify the
|
||||
<literal>O_CLOEXEC</literal> flag to avoid file descriptor leaks
|
||||
to subprocesses. (Applications which do not use multiple threads
|
||||
can also use <function>mkstemp</function>, but libraries should
|
||||
use <function>mkostemp</function>.) For determining the
|
||||
directory part of the file name pattern, see <xref
|
||||
linkend="chap-Defensive_Coding-Tasks-Temporary_Files-Location"/>.
|
||||
</para>
|
||||
<para>
|
||||
The file is not removed automatically. It is not safe to rename
|
||||
or delete the file before processing, or transform the name in
|
||||
any way (for example, by adding a file extension). If you need
|
||||
multiple temporary files, call <function>mkostemp</function>
|
||||
multiple times. Do not create additional file names derived
|
||||
from the name provided by a previous
|
||||
<function>mkostemp</function> call. However, it is safe to close
|
||||
the descriptor returned by <function>mkostemp</function> and
|
||||
reopen the file using the generated name.
|
||||
</para>
|
||||
<para>
|
||||
The Python class <literal>tempfile.NamedTemporaryFile</literal>
|
||||
provides similar functionality, except that the file is deleted
|
||||
automatically by default. Note that you may have to use the
|
||||
<literal>file</literal> attribute to obtain the actual file
|
||||
object because some programming interfaces cannot deal with
|
||||
file-like objects. The C function <function>mkostemp</function>
|
||||
is also available as <function>tempfile.mkstemp</function>.
|
||||
</para>
|
||||
<para>
|
||||
In Java, you can use the
|
||||
<function>java.io.File.createTempFile(String, String,
|
||||
File)</function> function, using the temporary file location
|
||||
determined according to <xref
|
||||
linkend="chap-Defensive_Coding-Tasks-Temporary_Files-Location"/>.
|
||||
Do not use <function>java.io.File.deleteOnExit()</function> to
|
||||
delete temporary files, and do not register a shutdown hook for
|
||||
each temporary file you create. In both cases, the deletion
|
||||
hint cannot be removed from the system if you delete the
|
||||
temporary file prior to termination of the VM, causing a memory
|
||||
leak.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section>
|
||||
<title>Temporary Files without Names</title>
|
||||
<para>
|
||||
The <function>tmpfile</function> function creates a temporary
|
||||
file and immediately deletes it, while keeping the file open.
|
||||
As a result, the file lacks a name and its space is deallocated
|
||||
as soon as the file descriptor is closed (including the implicit
|
||||
close when the process terminates). This avoids cluttering the
|
||||
temporary directory with orphaned files.
|
||||
</para>
|
||||
<para>
|
||||
Alternatively, if the maximum size of the temporary file is
|
||||
known beforehand, the <function>fmemopen</function> function can
|
||||
be used to create a <literal>FILE *</literal> object which is
|
||||
backed by memory.
|
||||
</para>
|
||||
<para>
|
||||
In Python, unnamed temporary files are provided by the
|
||||
<literal>tempfile.TemporaryFile</literal> class, and the
|
||||
<literal>tempfile.SpooledTemporaryFile</literal> class provides
|
||||
a way to avoid creation of small temporary files.
|
||||
</para>
|
||||
<para>
|
||||
Java does not support unnamed temporary files.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section id="chap-Defensive_Coding-Tasks-Temporary_Directory">
|
||||
<title>Temporary Directories</title>
|
||||
<para>
|
||||
The <function>mkdtemp</function> function can be used to create
|
||||
a temporary directory. (For determining the directory part of
|
||||
the file name pattern, see <xref
|
||||
linkend="chap-Defensive_Coding-Tasks-Temporary_Files-Location"/>.)
|
||||
The directory is not automatically removed. In Python, this
|
||||
function is available as <function>tempfile.mkdtemp</function>.
|
||||
In Java 7, temporary directories can be created using the
|
||||
<function>java.nio.file.Files.createTempDirectory(Path, String,
|
||||
FileAttribute...)</function> function.
|
||||
</para>
|
||||
<para>
|
||||
When creating files in the temporary directory, use
|
||||
automatically generated names, e.g., derived from a sequential
|
||||
counter. Files with externally provided names could be picked
|
||||
up in unexpected contexts, and crafted names could actually
|
||||
point outside of the tempoary directory (due to
|
||||
<emphasis>directory traversal</emphasis>).
|
||||
</para>
|
||||
<para>
|
||||
Removing a directory tree in a completely safe manner is
|
||||
complicated. Unless there are overriding performance concerns,
|
||||
the <application>rm</application> program should be used, with
|
||||
the <option>-rf</option> and <option>--</option> options.
|
||||
</para>
|
||||
</section>
|
||||
|
||||
<section>
|
||||
<title>Compensating for Unsafe File Creation</title>
|
||||
<para>
|
||||
There are two ways to make a function or program which excepts a
|
||||
file name safe for use with temporary files. See
|
||||
<xref linkend="sect-Defensive_Coding-Tasks-Processes-Creation"/>,
|
||||
for details on subprocess creation.
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
Create a temporary directory and place the file there. If
|
||||
possible, run the program in a subprocess which uses the
|
||||
temporary directory as its current directory, with a
|
||||
restricted environment.
|
||||
Use generated names for all files in that temporary
|
||||
directory. (See <xref
|
||||
linkend="chap-Defensive_Coding-Tasks-Temporary_Directory"/>.)
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Create the temporary file and pass the generated file name
|
||||
to the function or program. This only works if the function
|
||||
or program can cope with a zero-length existing file. It is
|
||||
safe only under additional assumptions:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
The function or program must not create additional files
|
||||
whose name is derived from the specified file name or
|
||||
are otherwise predictable.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
The function or program must not delete the file before
|
||||
processing it.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
It must not access any existing files in the same
|
||||
directory.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
<para>
|
||||
It is often difficult to check whether these additional
|
||||
assumptions are matched, therefore this approach is not
|
||||
recommended.
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
</section>
|
||||
</chapter>
|
|
@ -1,53 +0,0 @@
|
|||
<?xml version='1.0' encoding='utf-8' ?>
|
||||
<!DOCTYPE section PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd" [
|
||||
]>
|
||||
<chapter id="chap-Defensive_Coding-Vala">
|
||||
<title>The Vala Programming Language</title>
|
||||
<para>
|
||||
Vala is a programming language mainly targeted at GNOME developers.
|
||||
</para>
|
||||
<para>
|
||||
Its syntax is inspired by C# (and thus, indirectly, by Java). But
|
||||
unlike C# and Java, Vala does not attempt to provide memory safety:
|
||||
Vala is compiled to C, and the C code is compiled with GCC using
|
||||
typical compiler flags. Basic operations like integer arithmetic
|
||||
are directly mapped to C constructs. As a results, the
|
||||
recommendations in <xref linkend="chap-Defensive_Coding-C"/> apply.
|
||||
</para>
|
||||
<para>
|
||||
In particular, the following Vala language constructs can result in
|
||||
undefined behavior at run time:
|
||||
</para>
|
||||
<itemizedlist>
|
||||
<listitem>
|
||||
<para>
|
||||
Integer arithmetic, as described in <xref
|
||||
linkend="sect-Defensive_Coding-C-Arithmetic"/>.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Pointer arithmetic, string subscripting and the
|
||||
<literal>substring</literal> method on strings (the
|
||||
<literal>string</literal> class in the
|
||||
<literal>glib-2.0</literal> package) are not range-checked. It
|
||||
is the responsibility of the calling code to ensure that the
|
||||
arguments being passed are valid. This applies even to cases
|
||||
(like <literal>substring</literal>) where the implementation
|
||||
would have range information to check the validity of indexes.
|
||||
See <xref linkend="sect-Defensive_Coding-C-Pointers"/>.
|
||||
</para>
|
||||
</listitem>
|
||||
<listitem>
|
||||
<para>
|
||||
Similarly, Vala only performs garbage collection (through
|
||||
reference counting) for <literal>GObject</literal> values. For
|
||||
plain C pointers (such as strings), the programmer has to ensure
|
||||
that storage is deallocated once it is no longer needed (to
|
||||
avoid memory leaks), and that storage is not being deallocated
|
||||
while it is still being used (see <xref
|
||||
linkend="sect-Defensive_Coding-C-Use-After-Free"/>).
|
||||
</para>
|
||||
</listitem>
|
||||
</itemizedlist>
|
||||
</chapter>
|
File diff suppressed because it is too large
Load diff
File diff suppressed because it is too large
Load diff
Before Width: | Height: | Size: 108 KiB |
|
@ -1,4 +0,0 @@
|
|||
<?xml version="1.0"?>
|
||||
<locatingRules xmlns="http://thaiopensource.com/ns/locating-rules/1.0">
|
||||
<include rules="../schemas.xml"/>
|
||||
</locatingRules>
|
10
publican.cfg
10
publican.cfg
|
@ -1,10 +0,0 @@
|
|||
xml_lang: en-US
|
||||
brand: fedora
|
||||
chunk_section_depth: 3
|
||||
#product: Defensive_Coding
|
||||
#mainfile: Defensive_Coding
|
||||
#docname: Defensive_Coding
|
||||
web_version_label: UNUSED
|
||||
version: 1
|
||||
#git_branch: eng-docs-rhel-6
|
||||
doc_url: https://gitlab.com/redhat-sectech/defensive-coding-guide
|
|
@ -1,6 +0,0 @@
|
|||
<?xml version="1.0"?>
|
||||
<locatingRules xmlns="http://thaiopensource.com/ns/locating-rules/1.0">
|
||||
<documentElement localName="book" uri="docbook-schema/docbook.rnc"/>
|
||||
<documentElement localName="chapter" uri="docbook-schema/docbook.rnc"/>
|
||||
<documentElement localName="section" uri="docbook-schema/docbook.rnc"/>
|
||||
</locatingRules>
|
Loading…
Add table
Add a link
Reference in a new issue