2012-04-13 00:48:34 +02:00
|
|
|
#!/usr/bin/env python
|
|
|
|
# encoding: utf-8
|
|
|
|
# Hans-Martin von Gaudecker, 2012
|
|
|
|
|
|
|
|
"""
|
2012-04-13 18:32:34 +02:00
|
|
|
Run a Stata do-script in the directory specified by **ctx.bldnode**. The
|
|
|
|
first and only argument will be the name of the do-script (no extension),
|
|
|
|
which can be accessed inside the do-script by the local macro `1'. Useful
|
2012-04-13 00:48:34 +02:00
|
|
|
for keeping a log file.
|
|
|
|
|
2012-04-13 18:32:34 +02:00
|
|
|
The tool uses the log file that is automatically kept by Stata only
|
2012-04-13 00:48:34 +02:00
|
|
|
for error-catching purposes; it will be deleted if the task finishes
|
2012-04-13 18:32:34 +02:00
|
|
|
without error. In case of an error in **some_script.do**, you can inspect
|
|
|
|
it as **some_script.log** in the **ctx.bldnode** directory.
|
2012-04-13 00:48:34 +02:00
|
|
|
|
|
|
|
Note that Stata will not return an error code if it exits abnormally --
|
2012-04-13 18:32:34 +02:00
|
|
|
catching errors relies on parsing the log file mentioned before. Should
|
2012-04-13 00:48:34 +02:00
|
|
|
the parser behave incorrectly, please send an email to hmgaudecker [at] gmail.
|
|
|
|
|
2012-04-13 08:36:02 +02:00
|
|
|
**WARNING**
|
2012-04-13 00:48:34 +02:00
|
|
|
|
2012-04-13 18:32:34 +02:00
|
|
|
The tool will not work if multiple do-scripts of the same name---but in
|
2012-04-13 00:48:34 +02:00
|
|
|
different directories---are run at the same time! Avoid this situation.
|
|
|
|
|
2012-04-13 08:36:02 +02:00
|
|
|
Usage::
|
2012-04-13 00:48:34 +02:00
|
|
|
|
2012-04-13 18:32:34 +02:00
|
|
|
ctx(features='run_do_script',
|
|
|
|
source='some_script.do',
|
2012-04-13 00:48:34 +02:00
|
|
|
target=['some_table.tex', 'some_figure.eps'],
|
|
|
|
deps='some_data.csv')
|
|
|
|
"""
|
|
|
|
|
|
|
|
|
|
|
|
import os, re, sys
|
|
|
|
from waflib import Task, TaskGen, Logs
|
|
|
|
|
|
|
|
# Platform-specific Stata settings, assigned together per platform:
#   STATA_COMMANDS -- candidate names of the Stata executable,
#   STATAFLAGS     -- command-line flags placed before the do-file path,
#   STATAENCODING  -- encoding used when reading Stata's log file.
# Importing this module on any other platform raises an Exception.
if sys.platform.startswith('linux'):
    STATA_COMMANDS, STATAFLAGS, STATAENCODING = (
        ['stata-mp', 'stata-se', 'stata'],
        '-b -q do',
        # Not sure whether this is correct...
        'Latin-1',
    )
elif sys.platform == 'darwin':
    STATA_COMMANDS, STATAFLAGS, STATAENCODING = (
        ['Stata64MP', 'StataMP',
         'Stata64SE', 'StataSE',
         'Stata64', 'Stata'],
        '-e -q do',
        'MacRoman',
    )
elif sys.platform.lower().startswith('win'):
    STATA_COMMANDS, STATAFLAGS, STATAENCODING = (
        ['StataMP-64', 'StataMP-ia',
         'StataMP', 'StataSE-64',
         'StataSE-ia', 'StataSE',
         'Stata-64', 'Stata-ia',
         'Stata.e', 'WMPSTATA',
         'WSESTATA', 'WSTATA'],
        '/e do',
        'Latin-1',
    )
else:
    raise Exception("Unknown sys.platform: %s " % sys.platform)
|
|
|
|
|
|
|
|
def configure(ctx):
    """Look up a Stata executable and store the Stata settings in ctx.env.

    Asks ``ctx.find_program`` to search for any of the names in
    STATA_COMMANDS and to record the result under the variable name
    ``STATACMD``; the message below is passed as the "not found" text.
    Afterwards the platform's STATAFLAGS and STATAENCODING are copied
    into ``ctx.env``.
    """
    # The message text is part of the tool's output; keep it verbatim.
    not_found_msg = """\n
No Stata executable found!\n\n
If Stata is needed:\n
1) Check the settings of your system path.
2) Note we are looking for Stata executables called: %s
If yours has a different name, please report to hmgaudecker [at] gmail\n
Else:\n
Do not load the 'run_do_script' tool in the main wscript.\n\n""" % STATA_COMMANDS

    ctx.find_program(STATA_COMMANDS, var='STATACMD', errmsg=not_found_msg)

    ctx.env.STATAFLAGS = STATAFLAGS
    ctx.env.STATAENCODING = STATAENCODING
|
|
|
|
|
|
|
|
@Task.update_outputs
class run_do_script_base(Task.Task):
    """Base task that invokes Stata on a single do-script.

    The command line consists of the configured Stata executable and
    flags, the absolute path of the first source node, and the do-file
    trunk (file name without extension) as the script's only argument.
    """
    # The command template is handed to a shell rather than split into argv.
    shell = True
    run_str = ('"${STATACMD}" ${STATAFLAGS} '
               '"${SRC[0].abspath()}" "${DOFILETRUNK}"')
|
|
|
|
|
2012-04-13 18:32:34 +02:00
|
|
|
class run_do_script(run_do_script_base):
    """Run a do-script and detect failures through Stata's own log file.

    The log file at ``self.env.LOGFILEPATH`` is used only for catching
    errors: it is erased when no error is found in it and left in place
    for inspection otherwise.
    """

    def run(self):
        """Run Stata, then scan the tail of its log file for an error code.

        Returns the Stata error code (the digits of ``r(<code>)`` as a
        string) when one is found, otherwise None. The return value of
        the underlying command is not used; failure detection relies
        solely on the log file.
        """
        run_do_script_base.run(self)
        ret, log_tail = self.check_erase_log_file()
        if ret:
            Logs.error("""Running Stata on %s failed with code %r.\n\nCheck the log file %s, last 10 lines\n\n%s\n\n\n""" % (
                self.inputs[0].nice_path(), ret, self.env.LOGFILEPATH, log_tail))
        return ret

    def check_erase_log_file(self):
        """Parse Stata's default log file and erase it if everything okay.

        Only the last 10 lines of the log are inspected. A line that
        starts with ``r(<digits>)`` is treated as Stata's error marker.

        Returns a tuple ``(code, tail)``: the error code as a string and
        the joined last 10 log lines if an error marker was found, or
        ``(None, None)`` after deleting the log file if none was found.

        Parser is based on Brendan Halpin's shell script found here:
        http://teaching.sociology.ul.ie/bhalpin/wordpress/?p=122
        """
        # Index access rather than ``.major`` so the check also works when
        # ``sys.version_info`` is a plain tuple without named fields.
        if sys.version_info[0] >= 3:
            kwargs = {'file': self.env.LOGFILEPATH, 'mode': 'r', 'encoding': self.env.STATAENCODING}
        else:
            # Python 2's open() names its first parameter differently and
            # has no ``encoding`` argument.
            kwargs = {'name': self.env.LOGFILEPATH, 'mode': 'r'}

        with open(**kwargs) as log:
            log_tail = log.readlines()[-10:]

        for line in log_tail:
            # Raw string: "\(" is not a valid escape in a normal literal.
            error_found = re.match(r"r\(([0-9]+)\)", line)
            if error_found:
                return error_found.group(1), ''.join(log_tail)

        # Only end up here if the parser did not identify an error.
        os.remove(self.env.LOGFILEPATH)
        return None, None
|
|
|
|
|
|
|
|
|
2012-04-13 18:32:34 +02:00
|
|
|
@TaskGen.feature('run_do_script')
@TaskGen.before_method('process_source')
def apply_run_do_script(tg):
    """Task generator customising the options etc. to call Stata in batch
    mode for running a do-script.

    Creates one ``run_do_script`` task from ``tg.source`` (the do-script)
    and ``tg.target`` (its outputs), stores the do-file trunk and the
    expected log file path in the task's environment, and registers every
    entry of the optional ``deps`` attribute as a dependency node of the
    task. Aborts through ``tg.bld.fatal`` if the do-script or one of the
    dependencies cannot be found.
    """
    # Convert sources and targets to nodes
    src_node = tg.path.find_resource(tg.source)
    if not src_node:
        # Fail with a clear message instead of an AttributeError on
        # ``src_node.name`` further down.
        tg.bld.fatal('Could not find do-script %r' % (tg.source,))
    tgt_nodes = [tg.path.find_or_declare(t) for t in tg.to_list(tg.target)]

    tsk = tg.create_task('run_do_script', src=src_node, tgt=tgt_nodes)
    # File name of the do-script without its extension; passed to Stata as
    # the script's argument and used to derive the log file name.
    tsk.env.DOFILETRUNK = os.path.splitext(src_node.name)[0]
    tsk.env.LOGFILEPATH = os.path.join(tg.bld.bldnode.abspath(), '%s.log' % (tsk.env.DOFILETRUNK))

    # dependencies (if the attribute 'deps' changes, trigger a recompilation)
    for x in tg.to_list(getattr(tg, 'deps', [])):
        node = tg.path.find_resource(x)
        if not node:
            tg.bld.fatal('Could not find dependency %r for running %r' % (x, src_node.nice_path()))
        tsk.dep_nodes.append(node)
    Logs.debug('deps: found dependencies %r for running %r' % (tsk.dep_nodes, src_node.nice_path()))

    # Bypass the execution of process_source by setting the source to an empty list
    tg.source = []
|
|
|
|
|