|
Server : Apache/2.2.2 (Fedora) System : Linux App1.pathumtani.go.th 2.6.20-1.2320.fc5smp #1 SMP Tue Jun 12 19:40:16 EDT 2007 i686 User : apache ( 48) PHP Version : 5.2.9 Disable Function : NONE Directory : /proc/self/root/proc/self/root/usr/lib/python2.4/site-packages/yum/ |
Upload File : |
#!/usr/bin/python -tt
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU Library General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
# Copyright 2004 Duke University
import os
import os.path
import re
import fnmatch
import urlparse
import types
import time
import Errors
from urlgrabber.grabber import URLGrabber
import urlgrabber.mirror
from urlgrabber.grabber import URLGrabError
from repomd import repoMDObject
from repomd import mdErrors
from repomd import packageSack
from packages import YumAvailablePackage
import mdcache
import parser
_is_fnmatch_pattern = re.compile(r"[*?[]").search
class YumPackageSack(packageSack.PackageSack):
"""imports/handles package objects from an mdcache dict object"""
def __init__(self, packageClass):
packageSack.PackageSack.__init__(self)
self.pc = packageClass
self.added = {}
def addDict(self, repoid, datatype, dataobj, callback=None):
if self.added.has_key(repoid):
if datatype in self.added[repoid]:
return
total = len(dataobj.keys())
if datatype == 'metadata':
current = 0
for pkgid in dataobj.keys():
current += 1
if callback: callback.progressbar(current, total, repoid)
pkgdict = dataobj[pkgid]
po = self.pc(pkgdict, repoid)
po.simple['id'] = pkgid
self._addToDictAsList(self.pkgsByID, pkgid, po)
self.addPackage(po)
if not self.added.has_key(repoid):
self.added[repoid] = []
self.added[repoid].append('metadata')
# indexes will need to be rebuilt
self.indexesBuilt = 0
elif datatype in ['filelists', 'otherdata']:
if self.added.has_key(repoid):
if 'metadata' not in self.added[repoid]:
raise Errors.RepoError, '%s md for %s imported before primary' \
% (datatype, repoid)
current = 0
for pkgid in dataobj.keys():
current += 1
if callback: callback.progressbar(current, total, repoid)
pkgdict = dataobj[pkgid]
if self.pkgsByID.has_key(pkgid):
for po in self.pkgsByID[pkgid]:
po.importFromDict(pkgdict, repoid)
self.added[repoid].append(datatype)
# indexes will need to be rebuilt
self.indexesBuilt = 0
else:
# umm, wtf?
pass
class RepoStorage:
"""This class contains multiple repositories and core configuration data
about them."""
def __init__(self):
self.repos = {} # list of repos by repoid pointing a repo object
# of repo options/misc data
self.callback = None # progress callback used for populateSack() for importing the xml files
self.cache = 0
# Check to see if we can import sqlite stuff
try:
import sqlitecache
import sqlitesack
except ImportError:
self.sqlite = False
else:
self.sqlite = True
self.sqlitecache = sqlitecache
self._selectSackType()
def _selectSackType(self):
if (self.sqlite):
import sqlitecache
import sqlitesack
self.pkgSack = sqlitesack.YumSqlitePackageSack(sqlitesack.YumAvailablePackageSqlite)
else:
self.pkgSack = YumPackageSack(YumAvailablePackage)
def __str__(self):
return str(self.repos.keys())
def add(self, repoobj):
if self.repos.has_key(repoobj.id):
raise Errors.RepoError, 'Repository %s is listed more than once in the configuration' % (repoobj.id)
self.repos[repoobj.id] = repoobj
def delete(self, repoid):
if self.repos.has_key(repoid):
del self.repos[repoid]
def sort(self):
repolist = self.repos.values()
repolist.sort()
return repolist
def getRepo(self, repoid):
try:
return self.repos[repoid]
except KeyError, e:
raise Errors.RepoError, \
'Error getting repository data for %s, repository not found' % (repoid)
def findRepos(self,pattern):
"""find all repositories matching fnmatch `pattern`"""
result = []
for item in pattern.split(','):
item = item.strip()
match = re.compile(fnmatch.translate(item)).match
for name,repo in self.repos.items():
if match(name):
result.append(repo)
return result
def disableRepo(self, repoid):
"""disable a repository from use
fnmatch wildcards may be used to disable a group of repositories.
returns repoid of disabled repos as list
"""
repos = []
if _is_fnmatch_pattern(repoid) or repoid.find(',') != -1:
for repo in self.findRepos(repoid):
repos.append(repo.id)
repo.disable()
else:
thisrepo = self.getRepo(repoid)
repos.append(thisrepo.id)
thisrepo.disable()
return repos
def enableRepo(self, repoid):
"""enable a repository for use
fnmatch wildcards may be used to enable a group of repositories.
returns repoid of enables repos as list
"""
repos = []
if _is_fnmatch_pattern(repoid) or repoid.find(',') != -1:
for repo in self.findRepos(repoid):
repos.append(repo.id)
repo.enable()
else:
thisrepo = self.getRepo(repoid)
repos.append(thisrepo.id)
thisrepo.enable()
return repos
def listEnabled(self):
"""return list of enabled repo objects"""
returnlist = []
for repo in self.repos.values():
if repo.enabled:
returnlist.append(repo)
return returnlist
def listGroupsEnabled(self):
"""return a list of repo objects that have groups enabled"""
returnlist = []
for repo in self.listEnabled():
if repo.enablegroups:
returnlist.append(repo)
return returnlist
def setCache(self, cacheval):
"""sets cache value in all repos"""
self.cache = cacheval
for repo in self.repos.values():
repo.cache = cacheval
def setCacheDir(self, cachedir):
"""sets the cachedir value in all repos"""
for repo in self.repos.values():
repo.basecachedir = cachedir
def setProgressBar(self, obj):
"""set's the progress bar for downloading files from repos"""
for repo in self.repos.values():
repo.callback = obj
repo.setupGrab()
def setFailureCallback(self, obj):
"""set's the failure callback for all repos"""
for repo in self.repos.values():
repo.failure_obj = obj
repo.setupGrab()
def populateSack(self, which='enabled', with='metadata', callback=None, pickleonly=0):
"""This populates the package sack from the repositories, two optional
arguments: which='repoid, enabled, all'
with='metadata, filelists, otherdata, all'"""
if not callback:
callback = self.callback
myrepos = []
if which == 'enabled':
myrepos = self.listEnabled()
elif which == 'all':
myrepos = self.repos.values()
else:
if type(which) == types.ListType:
for repo in which:
if isinstance(repo, Repository):
myrepos.append(repo)
else:
repobj = self.getRepo(repo)
myrepos.append(repobj)
elif type(which) == types.StringType:
repobj = self.getRepo(which)
myrepos.append(repobj)
if with == 'all':
data = ['metadata', 'filelists', 'otherdata']
else:
data = [ with ]
for repo in myrepos:
if not hasattr(repo, 'cacheHandler'):
if (self.sqlite):
repo.cacheHandler = self.sqlitecache.RepodataParserSqlite(
storedir=repo.cachedir,
repoid=repo.id,
callback=callback,
)
else:
repo.cacheHandler = mdcache.RepodataParser(
storedir=repo.cachedir,
callback=callback
)
for item in data:
if self.pkgSack.added.has_key(repo.id):
if item in self.pkgSack.added[repo.id]:
continue
if item == 'metadata':
xml = repo.getPrimaryXML()
(ctype, csum) = repo.repoXML.primaryChecksum()
dobj = repo.cacheHandler.getPrimary(xml, csum)
if not pickleonly:
self.pkgSack.addDict(repo.id, item, dobj, callback)
del dobj
elif item == 'filelists':
xml = repo.getFileListsXML()
(ctype, csum) = repo.repoXML.filelistsChecksum()
dobj = repo.cacheHandler.getFilelists(xml, csum)
if not pickleonly:
self.pkgSack.addDict(repo.id, item, dobj, callback)
del dobj
elif item == 'otherdata':
xml = repo.getOtherXML()
(ctype, csum) = repo.repoXML.otherChecksum()
dobj = repo.cacheHandler.getOtherdata(xml, csum)
if not pickleonly:
self.pkgSack.addDict(repo.id, item, dobj, callback)
del dobj
else:
# how odd, just move along
continue
# get rid of all this stuff we don't need now
del repo.cacheHandler
class Repository:
"""this is an actual repository object"""
def __init__(self, repoid):
self.id = repoid
self.name = repoid # name is repoid until someone sets it to a real name
# some default (ish) things
self.urls = []
self.gpgcheck = 0
self.enabled = 0
self.enablegroups = 0
self.groupsfilename = 'yumgroups.xml' # something some freaks might
# eventually want
self.setkeys = []
self.repoMDFile = 'repodata/repomd.xml'
self.repoXML = None
self.cache = 0
self.callback = None # callback for the grabber
self.failure_obj = None
self.mirrorlist = None # filename/url of mirrorlist file
self.mirrorlistparsed = 0
self.baseurl = [] # baseurls from the config file
self.yumvar = {} # empty dict of yumvariables for $string replacement
self.proxy_password = None
self.proxy_username = None
self.proxy = None
self._proxy_dict = {}
self.metadata_cookie_fn = 'cachecookie'
self.groups_added = False
# throw in some stubs for things that will be set by the config class
self.basecachedir = ""
self.cachedir = ""
self.pkgdir = ""
self.hdrdir = ""
# holder for stuff we've grabbed
self.retrieved = { 'primary':0, 'filelists':0, 'other':0, 'groups':0 }
def __cmp__(self, other):
if self.id > other.id:
return 1
elif self.id < other.id:
return -1
else:
return 0
def __str__(self):
return self.id
def _checksum(self, sumtype, file, CHUNK=2**16):
"""takes filename, hand back Checksum of it
sumtype = md5 or sha
filename = /path/to/file
CHUNK=65536 by default"""
# chunking brazenly lifted from Ryan Tomayko
try:
if type(file) is not types.StringType:
fo = file # assume it's a file-like-object
else:
fo = open(file, 'r', CHUNK)
if sumtype == 'md5':
import md5
sum = md5.new()
elif sumtype == 'sha':
import sha
sum = sha.new()
else:
raise Errors.RepoError, 'Error Checksumming file, wrong \
checksum type %s' % sumtype
chunk = fo.read
while chunk:
chunk = fo.read(CHUNK)
sum.update(chunk)
if type(file) is types.StringType:
fo.close()
del fo
return sum.hexdigest()
except (EnvironmentError, IOError, OSError):
raise Errors.RepoError, 'Error opening file for checksum'
def dump(self):
output = '[%s]\n' % self.id
vars = ['name', 'bandwidth', 'enabled', 'enablegroups',
'gpgcheck', 'includepkgs', 'keepalive', 'proxy',
'proxy_password', 'proxy_username', 'exclude',
'retries', 'throttle', 'timeout', 'mirrorlist',
'cachedir', 'gpgkey', 'pkgdir', 'hdrdir']
vars.sort()
for attr in vars:
output = output + '%s = %s\n' % (attr, getattr(self, attr))
output = output + 'baseurl ='
for url in self.urls:
output = output + ' %s\n' % url
return output
def enable(self):
self.baseurlSetup()
self.set('enabled', 1)
def disable(self):
self.set('enabled', 0)
def check(self):
"""self-check the repo information - if we don't have enough to move
on then raise a repo error"""
if len(self.urls) < 1:
raise Errors.RepoError, \
'Cannot find a valid baseurl for repo: %s' % self.id
def set(self, key, value):
"""sets a generic attribute of this repository"""
self.setkeys.append(key)
setattr(self, key, value)
def unset(self, key):
"""delete an attribute of this repository"""
self.setkeys.remove(key)
delattr(self, key)
def listSetKeys(self):
return self.setkeys
def doProxyDict(self):
if self._proxy_dict:
return
self._proxy_dict = {} # zap it
proxy_string = None
if self.proxy not in [None, '_none_']:
proxy_string = '%s' % self.proxy
if self.proxy_username is not None:
proxy_parsed = urlparse.urlsplit(self.proxy, allow_fragments=0)
proxy_proto = proxy_parsed[0]
proxy_host = proxy_parsed[1]
proxy_rest = proxy_parsed[2] + '?' + proxy_parsed[3]
proxy_string = '%s://%s@%s%s' % (proxy_proto,
self.proxy_username, proxy_host, proxy_rest)
if self.proxy_password is not None:
proxy_string = '%s://%s:%s@%s%s' % (proxy_proto,
self.proxy_username, self.proxy_password,
proxy_host, proxy_rest)
if proxy_string is not None:
self._proxy_dict['http'] = proxy_string
self._proxy_dict['https'] = proxy_string
self._proxy_dict['ftp'] = proxy_string
def setupGrab(self):
"""sets up the grabber functions with the already stocked in urls for
the mirror groups"""
if self.failovermethod == 'roundrobin':
mgclass = urlgrabber.mirror.MGRandomOrder
else:
mgclass = urlgrabber.mirror.MirrorGroup
self.grabfunc = URLGrabber(keepalive=self.keepalive,
bandwidth=self.bandwidth,
retry=self.retries,
throttle=self.throttle,
progress_obj=self.callback,
proxies = self.proxy_dict,
failure_callback=self.failure_obj,
timeout=self.timeout,
reget='simple')
self.grab = mgclass(self.grabfunc, self.urls)
def dirSetup(self):
"""make the necessary dirs, if possible, raise on failure"""
cachedir = os.path.join(self.basecachedir, self.id)
pkgdir = os.path.join(cachedir, 'packages')
hdrdir = os.path.join(cachedir, 'headers')
self.set('cachedir', cachedir)
self.set('pkgdir', pkgdir)
self.set('hdrdir', hdrdir)
cookie = self.cachedir + '/' + self.metadata_cookie_fn
self.set('metadata_cookie', cookie)
for dir in [self.cachedir, self.hdrdir, self.pkgdir]:
if self.cache == 0:
if os.path.exists(dir) and os.path.isdir(dir):
continue
else:
try:
os.makedirs(dir, mode=0755)
except OSError, e:
raise Errors.RepoError, \
"Error making cache directory: %s error was: %s" % (dir, e)
else:
if not os.path.exists(dir):
raise Errors.RepoError, \
"Cannot access repository dir %s" % dir
def baseurlSetup(self):
"""go through the baseurls and mirrorlists and populate self.urls
with valid ones, run self.check() at the end to make sure it worked"""
goodurls = []
if self.mirrorlist and not self.mirrorlistparsed:
mirrorurls = getMirrorList(self.mirrorlist, self.proxy_dict)
self.mirrorlistparsed = 1
for url in mirrorurls:
url = parser.varReplace(url, self.yumvar)
self.baseurl.append(url)
for url in self.baseurl:
url = parser.varReplace(url, self.yumvar)
(s,b,p,q,f,o) = urlparse.urlparse(url)
if s not in ['http', 'ftp', 'file', 'https']:
print 'not using ftp, http[s], or file for repos, skipping - %s' % (url)
continue
else:
goodurls.append(url)
self.set('urls', goodurls)
self.check()
self.setupGrab() # update the grabber for the urls
def get(self, url=None, relative=None, local=None, start=None, end=None,
copy_local=0, checkfunc=None, text=None, reget='simple', cache=True):
"""retrieve file from the mirrorgroup for the repo
relative to local, optionally get range from
start to end, also optionally retrieve from a specific baseurl"""
# if local or relative is None: raise an exception b/c that shouldn't happen
# if url is not None - then do a grab from the complete url - not through
# the mirror, raise errors as need be
# if url is None do a grab via the mirror group/grab for the repo
# return the path to the local file
if cache:
headers = None
else:
headers = (('Pragma', 'no-cache'),)
if local is None or relative is None:
raise Errors.RepoError, \
"get request for Repo %s, gave no source or dest" % self.id
if self.failure_obj:
(f_func, f_args, f_kwargs) = self.failure_obj
self.failure_obj = (f_func, f_args, f_kwargs)
if self.cache == 1:
if os.path.exists(local): # FIXME - we should figure out a way
return local # to run the checkfunc from here
else: # ain't there - raise
raise Errors.RepoError, \
"Caching enabled but no local cache of %s from %s" % (local,
self)
if url is not None:
ug = URLGrabber(keepalive = self.keepalive,
bandwidth = self.bandwidth,
retry = self.retries,
throttle = self.throttle,
progres_obj = self.callback,
copy_local = copy_local,
reget = reget,
proxies = self.proxy_dict,
failure_callback = self.failure_obj,
timeout=self.timeout,
checkfunc=checkfunc,
http_headers=headers,
)
remote = url + '/' + relative
try:
result = ug.urlgrab(remote, local,
text=text,
range=(start, end),
)
except URLGrabError, e:
raise Errors.RepoError, \
"failed to retrieve %s from %s\nerror was %s" % (relative, self.id, e)
else:
try:
result = self.grab.urlgrab(relative, local,
text = text,
range = (start, end),
copy_local=copy_local,
reget = reget,
checkfunc=checkfunc,
http_headers=headers,
)
except URLGrabError, e:
raise Errors.RepoError, "failure: %s from %s: %s" % (relative, self.id, e)
return result
def metadataCurrent(self):
"""Check if there is a metadata_cookie and check its age. If the
age of the cookie is less than metadata_expire time then return true
else return False"""
val = False
if os.path.exists(self.metadata_cookie):
cookie_info = os.stat(self.metadata_cookie)
if cookie_info[8] + self.metadata_expire > time.time():
val = True
return val
def setMetadataCookie(self):
"""if possible, set touch the metadata_cookie file"""
check = self.metadata_cookie
if not os.path.exists(self.metadata_cookie):
check = self.cachedir
if os.access(check, os.W_OK):
fo = open(self.metadata_cookie, 'w+')
fo.close()
del fo
def getRepoXML(self, text=None):
"""retrieve/check/read in repomd.xml from the repository"""
remote = self.repoMDFile
local = self.cachedir + '/repomd.xml'
if self.repoXML is not None:
return
if self.cache or self.metadataCurrent():
if not os.path.exists(local):
raise Errors.RepoError, 'Cannot find repomd.xml file for %s' % (self)
else:
result = local
else:
checkfunc = (self._checkRepoXML, (), {})
try:
result = self.get(relative=remote,
local=local,
copy_local=1,
text=text,
reget=None,
checkfunc=checkfunc,
cache=self.http_caching == 'all')
except URLGrabError, e:
raise Errors.RepoError, 'Error downloading file %s: %s' % (local, e)
# if we have a 'fresh' repomd.xml then update the cookie
self.setMetadataCookie()
try:
self.repoXML = repoMDObject.RepoMD(self.id, result)
except mdErrors.RepoMDError, e:
raise Errors.RepoError, 'Error importing repomd.xml from %s: %s' % (self, e)
def _checkRepoXML(self, fo):
if type(fo) is types.InstanceType:
filepath = fo.filename
else:
filepath = fo
try:
foo = repoMDObject.RepoMD(self.id, filepath)
except mdErrors.RepoMDError, e:
raise URLGrabError(-1, 'Error importing repomd.xml for %s: %s' % (self, e))
def __getProxyDict(self):
self.doProxyDict()
if self._proxy_dict:
return self._proxy_dict
return None
# consistent access to how proxy information should look (and ensuring
# that it's actually determined for the repo)
proxy_dict = property(__getProxyDict)
def _checkMD(self, fn, mdtype):
"""check the metadata type against its checksum"""
csumDict = { 'primary' : self.repoXML.primaryChecksum,
'filelists' : self.repoXML.filelistsChecksum,
'other' : self.repoXML.otherChecksum,
'group' : self.repoXML.groupChecksum }
csumMethod = csumDict[mdtype]
(r_ctype, r_csum) = csumMethod() # get the remote checksum
if type(fn) == types.InstanceType: # this is an urlgrabber check
file = fn.filename
else:
file = fn
try:
l_csum = self._checksum(r_ctype, file) # get the local checksum
except Errors.RepoError, e:
raise URLGrabError(-3, 'Error performing checksum')
if l_csum == r_csum:
return 1
else:
raise URLGrabError(-1, 'Metadata file does not match checksum')
def _retrieveMD(self, mdtype):
"""base function to retrieve metadata files from the remote url
returns the path to the local metadata file of a 'mdtype'
mdtype can be 'primary', 'filelists', 'other' or 'group'."""
locDict = { 'primary' : self.repoXML.primaryLocation,
'filelists' : self.repoXML.filelistsLocation,
'other' : self.repoXML.otherLocation,
'group' : self.repoXML.groupLocation }
locMethod = locDict[mdtype]
(r_base, remote) = locMethod()
fname = os.path.basename(remote)
local = self.cachedir + '/' + fname
if self.retrieved.has_key(mdtype):
if self.retrieved[mdtype]: # got it, move along
return local
if self.cache == 1:
if os.path.exists(local):
try:
self._checkMD(local, mdtype)
except URLGrabError, e:
raise Errors.RepoError, \
"Caching enabled and local cache: %s does not match checksum" % local
else:
return local
else: # ain't there - raise
raise Errors.RepoError, \
"Caching enabled but no local cache of %s from %s" % (local,
self)
if os.path.exists(local):
try:
self._checkMD(local, mdtype)
except URLGrabError, e:
pass
else:
self.retrieved[mdtype] = 1
return local # it's the same return the local one
try:
checkfunc = (self._checkMD, (mdtype,), {})
local = self.get(relative=remote, local=local, copy_local=1,
checkfunc=checkfunc, reget=None,
cache=self.http_caching == 'all')
except URLGrabError, e:
raise Errors.RepoError, \
"Could not retrieve %s matching remote checksum from %s" % (local, self)
else:
self.retrieved[mdtype] = 1
return local
def getPrimaryXML(self):
"""this gets you the path to the primary.xml file, retrieving it if we
need a new one"""
return self._retrieveMD('primary')
def getFileListsXML(self):
"""this gets you the path to the filelists.xml file, retrieving it if we
need a new one"""
return self._retrieveMD('filelists')
def getOtherXML(self):
return self._retrieveMD('other')
def getGroups(self):
"""gets groups and returns group file path for the repository, if there
is none it returns None"""
try:
file = self._retrieveMD('group')
except URLGrabError:
file = None
return file
def getMirrorList(mirrorlist, pdict = None):
"""retrieve an up2date-style mirrorlist file from a url,
we also s/$ARCH/$BASEARCH/ and move along
returns a list of the urls from that file"""
returnlist = []
if hasattr(urlgrabber.grabber, 'urlopen'):
urlresolver = urlgrabber.grabber
else:
urlresolver = urllib
scheme = urlparse.urlparse(mirrorlist)[0]
if scheme == '':
url = 'file://' + mirrorlist
else:
url = mirrorlist
try:
fo = urlresolver.urlopen(url, proxies=pdict)
except urlgrabber.grabber.URLGrabError, e:
fo = None
if fo is not None:
content = fo.readlines()
for line in content:
if re.match('^\s*\#.*', line) or re.match('^\s*$', line):
continue
mirror = re.sub('\n$', '', line) # no more trailing \n's
(mirror, count) = re.subn('\$ARCH', '$BASEARCH', mirror)
returnlist.append(mirror)
return returnlist